[ { "page_no": 0, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 128.58112000000006, "r_x1": 480.59735, "r_y1": 128.58112000000006, "r_x2": 480.59735, "r_y2": 115.89910999999995, "r_x3": 134.765, "r_y3": 115.89910999999995, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 266.67499, "r_y0": 146.51409999999998, "r_x1": 348.68506, "r_y1": 146.51409999999998, "r_x2": 348.68506, "r_y2": 133.83209, "r_x3": 266.67499, "r_y3": 133.83209, "coord_origin": "TOPLEFT" }, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.22598, "r_y0": 180.47069999999997, "r_x1": 217.04390999999998, "r_y1": 180.47069999999997, "r_x2": 217.04390999999998, "r_y2": 171.67371000000003, "r_x3": 151.22598, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.04599, "r_y0": 176.27484000000004, "r_x1": 235.18764, "r_y1": 176.27484000000004, "r_x2": 235.18764, "r_y2": 170.08209, "r_x3": 217.04599, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.18598999999998, "r_y0": 176.27484000000004, "r_x1": 241.4129, "r_y1": 176.27484000000004, "r_x2": 241.4129, "r_y2": 169.69159000000002, "r_x3": 235.18598999999998, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41299000000004, "r_y0": 176.27484000000004, "r_x1": 257.29932, "r_y1": 176.27484000000004, "r_x2": 257.29932, "r_y2": 170.08209, "r_x3": 241.41299000000004, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.298, "r_y0": 176.27484000000004, "r_x1": 263.5249, "r_y1": 176.27484000000004, "r_x2": 263.5249, "r_y2": 169.69159000000002, "r_x3": 257.298, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52499, "r_y0": 176.27484000000004, "r_x1": 279.41132, "r_y1": 176.27484000000004, "r_x2": 279.41132, "r_y2": 170.08209, "r_x3": 263.52499, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27484000000004, "r_x1": 285.6369, "r_y1": 176.27484000000004, "r_x2": 285.6369, "r_y2": 169.69159000000002, "r_x3": 279.41, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63602, "r_y0": 180.47069999999997, "r_x1": 392.27664, "r_y1": 180.47069999999997, "r_x2": 392.27664, "r_y2": 171.67371000000003, "r_x3": 285.63602, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.27502, "r_y0": 176.27484000000004, "r_x1": 398.50192, "r_y1": 176.27484000000004, "r_x2": 398.50192, "r_y2": 169.69159000000002, "r_x3": 392.27502, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.50201, "r_y0": 176.27484000000004, "r_x1": 414.38834, "r_y1": 176.27484000000004, "r_x2": 414.38834, "r_y2": 170.08209, "r_x3": 398.50201, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.38702, "r_y0": 176.27484000000004, "r_x1": 420.61392, "r_y1": 176.27484000000004, "r_x2": 420.61392, "r_y2": 169.69159000000002, "r_x3": 414.38702, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61304, "r_y0": 176.27484000000004, "r_x1": 436.49936, "r_y1": 176.27484000000004, "r_x2": 436.49936, "r_y2": 170.08209, "r_x3": 420.61304, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.49805000000003, "r_y0": 176.27484000000004, "r_x1": 442.72495000000004, "r_y1": 176.27484000000004, "r_x2": 442.72495000000004, "r_y2": 169.69159000000002, "r_x3": 436.49805000000003, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.72504, "r_y0": 180.47069999999997, "r_x1": 464.12963999999994, "r_y1": 180.47069999999997, "r_x2": 464.12963999999994, "r_y2": 171.67371000000003, "r_x3": 442.72504, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34305, "r_y0": 192.42571999999996, "r_x1": 224.80720999999997, "r_y1": 192.42571999999996, "r_x2": 224.80720999999997, "r_y2": 183.62872000000004, "r_x3": 139.34305, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.80704000000003, "r_y0": 188.23090000000002, "r_x1": 242.94868, "r_y1": 188.23090000000002, "r_x2": 242.94868, "r_y2": 182.03814999999997, "r_x3": 224.80704000000003, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.94704000000002, "r_y0": 188.23090000000002, "r_x1": 249.17394999999996, "r_y1": 188.23090000000002, "r_x2": 249.17394999999996, "r_y2": 181.64764000000002, "r_x3": 242.94704000000002, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17404000000002, "r_y0": 188.23090000000002, "r_x1": 265.06036, "r_y1": 188.23090000000002, "r_x2": 265.06036, "r_y2": 182.03814999999997, "r_x3": 249.17404000000002, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.05905, "r_y0": 188.23090000000002, "r_x1": 271.28595, "r_y1": 188.23090000000002, "r_x2": 271.28595, "r_y2": 181.64764000000002, "r_x3": 265.05905, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.28506, "r_y0": 188.23090000000002, "r_x1": 287.17139, "r_y1": 188.23090000000002, "r_x2": 287.17139, "r_y2": 182.03814999999997, "r_x3": 271.28506, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17007, "r_y0": 188.23090000000002, "r_x1": 293.39697, "r_y1": 188.23090000000002, "r_x2": 293.39697, "r_y2": 181.64764000000002, "r_x3": 287.17007, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.39706, "r_y0": 192.42571999999996, "r_x1": 404.1597, "r_y1": 192.42571999999996, "r_x2": 404.1597, "r_y2": 183.62872000000004, "r_x3": 293.39706, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.15808, "r_y0": 188.23090000000002, "r_x1": 410.38498, "r_y1": 188.23090000000002, "r_x2": 410.38498, "r_y2": 181.64764000000002, "r_x3": 404.15808, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.38507, "r_y0": 188.23090000000002, "r_x1": 426.27139, "r_y1": 188.23090000000002, "r_x2": 426.27139, "r_y2": 182.03814999999997, "r_x3": 410.38507, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27008, "r_y0": 188.23090000000002, "r_x1": 432.49697999999995, "r_y1": 188.23090000000002, "r_x2": 432.49697999999995, "r_y2": 181.64764000000002, "r_x3": 426.27008, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.49609, "r_y0": 188.23090000000002, "r_x1": 448.3824200000001, "r_y1": 188.23090000000002, "r_x2": 448.3824200000001, "r_y2": 182.03814999999997, "r_x3": 432.49609, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.3811, "r_y0": 188.23090000000002, "r_x1": 454.608, "r_y1": 188.23090000000002, "r_x2": 454.608, "r_y2": 181.64764000000002, "r_x3": 448.3811, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.60808999999995, "r_y0": 192.42571999999996, "r_x1": 476.01270000000005, "r_y1": 192.42571999999996, "r_x2": 476.01270000000005, "r_y2": 183.62872000000004, "r_x3": 454.60808999999995, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52109000000002, "r_y0": 204.38073999999995, "r_x1": 298.6087, "r_y1": 204.38073999999995, "r_x2": 298.6087, "r_y2": 195.58374000000003, "r_x3": 229.52109000000002, "r_y3": 195.58374000000003, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.60608, "r_y0": 200.18591000000004, "r_x1": 316.74771, "r_y1": 200.18591000000004, "r_x2": 316.74771, "r_y2": 193.99316, "r_x3": 298.60608, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74609, "r_y0": 200.18591000000004, "r_x1": 322.97299, "r_y1": 200.18591000000004, "r_x2": 322.97299, "r_y2": 193.60266000000001, "r_x3": 316.74609, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97308, "r_y0": 200.18591000000004, "r_x1": 338.85941, "r_y1": 200.18591000000004, "r_x2": 338.85941, "r_y2": 193.99316, "r_x3": 322.97308, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.85809, "r_y0": 200.18591000000004, "r_x1": 345.08499, "r_y1": 200.18591000000004, "r_x2": 345.08499, "r_y2": 193.60266000000001, "r_x3": 338.85809, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.08508, "r_y0": 200.18591000000004, "r_x1": 360.97141, "r_y1": 200.18591000000004, "r_x2": 360.97141, "r_y2": 193.99316, "r_x3": 345.08508, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97009, "r_y0": 200.18591000000004, "r_x1": 367.19699, "r_y1": 200.18591000000004, "r_x2": 367.19699, "r_y2": 193.60266000000001, "r_x3": 360.97009, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.19611, "r_y0": 200.18591000000004, "r_x1": 385.33774, "r_y1": 200.18591000000004, "r_x2": 385.33774, "r_y2": 193.99316, "r_x3": 367.19611, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1051, "r_y0": 225.27368, "r_x1": 336.25153, "r_y1": 225.27368, "r_x2": 336.25153, "r_y2": 217.20398, "r_x3": 279.1051, "r_y3": 217.20398, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.96609, "r_y0": 236.27752999999996, "r_x1": 392.38983, "r_y1": 236.27752999999996, "r_x2": 392.38983, "r_y2": 228.80853000000002, "r_x3": 222.96609, "r_y3": 228.80853000000002, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 278.22748, "r_x1": 206.6358, "r_y1": 278.22748, "r_x2": 206.6358, "r_y2": 270.30115, "r_x3": 163.1111, "r_y3": 270.30115, "coord_origin": "TOPLEFT" }, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.6171, "r_y0": 278.43364999999994, "r_x1": 452.2447199999999, "r_y1": 278.43364999999994, "r_x2": 452.2447199999999, "r_y2": 270.36395000000005, "r_x3": 211.6171, "r_y3": 270.36395000000005, "coord_origin": "TOPLEFT" }, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 289.39267, "r_x1": 452.24246, "r_y1": 289.39267, "r_x2": 452.24246, "r_y2": 281.3229099999999, "r_x3": 163.1111, "r_y3": 281.3229099999999, "coord_origin": "TOPLEFT" }, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 300.35165000000006, "r_x1": 452.24792, "r_y1": 300.35165000000006, "r_x2": 452.24792, "r_y2": 292.28189, "r_x3": 163.1111, "r_y3": 292.28189, "coord_origin": "TOPLEFT" }, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 311.31064, "r_x1": 452.2407799999999, "r_y1": 311.31064, "r_x2": 452.2407799999999, "r_y2": 303.24088, "r_x3": 163.1111, "r_y3": 303.24088, "coord_origin": "TOPLEFT" }, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 322.26865, "r_x1": 452.24609, "r_y1": 322.26865, "r_x2": 452.24609, "r_y2": 314.19888, "r_x3": 163.1111, "r_y3": 314.19888, "coord_origin": "TOPLEFT" }, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 333.22763, "r_x1": 452.24615000000006, "r_y1": 333.22763, "r_x2": 452.24615000000006, "r_y2": 325.15787, "r_x3": 163.1111, "r_y3": 325.15787, "coord_origin": "TOPLEFT" }, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 344.18661, "r_x1": 452.24707, "r_y1": 344.18661, "r_x2": 452.24707, "r_y2": 336.11685, "r_x3": 163.1111, "r_y3": 336.11685, "coord_origin": "TOPLEFT" }, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 355.1456, "r_x1": 452.2459999999999, "r_y1": 355.1456, "r_x2": 452.2459999999999, "r_y2": 347.07584, "r_x3": 163.1111, "r_y3": 347.07584, "coord_origin": "TOPLEFT" }, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 366.10458, "r_x1": 452.2479900000001, "r_y1": 366.10458, "r_x2": 452.2479900000001, "r_y2": 358.03482, "r_x3": 163.1111, "r_y3": 358.03482, "coord_origin": "TOPLEFT" }, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 377.06357, "r_x1": 452.24609, "r_y1": 377.06357, "r_x2": 452.24609, "r_y2": 368.9938, "r_x3": 163.1111, "r_y3": 368.9938, "coord_origin": "TOPLEFT" }, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 388.02255, "r_x1": 452.2417, "r_y1": 388.02255, "r_x2": 452.2417, "r_y2": 379.95279, "r_x3": 163.1111, "r_y3": 379.95279, "coord_origin": "TOPLEFT" }, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 398.98154, "r_x1": 452.2443200000001, "r_y1": 398.98154, "r_x2": 452.2443200000001, "r_y2": 390.91177, "r_x3": 163.1111, "r_y3": 390.91177, "coord_origin": "TOPLEFT" }, "text": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 409.94052, "r_x1": 452.24878000000007, "r_y1": 409.94052, "r_x2": 452.24878000000007, "r_y2": 401.87076, "r_x3": 163.1111, "r_y3": 401.87076, "coord_origin": "TOPLEFT" }, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 420.8995100000001, "r_x1": 452.24063000000007, "r_y1": 420.8995100000001, "r_x2": 452.24063000000007, "r_y2": 412.82974, "r_x3": 163.1111, "r_y3": 412.82974, "coord_origin": "TOPLEFT" }, "text": "accuracy improves significantly, inference time is halved compared to", "orig": "accuracy improves significantly, inference time is halved compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 431.85751000000005, "r_x1": 452.24161, "r_y1": 431.85751000000005, "r_x2": 452.24161, "r_y2": 423.78774999999996, "r_x3": 163.1111, "r_y3": 423.78774999999996, "coord_origin": "TOPLEFT" }, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 442.8165, "r_x1": 452.24429, "r_y1": 442.8165, "r_x2": 452.24429, "r_y2": 434.74673, "r_x3": 163.1111, "r_y3": 434.74673, "coord_origin": "TOPLEFT" }, "text": "tactically correct. This in turn eliminates most post-processing needs.", "orig": "tactically correct. This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 453.77547999999996, "r_x1": 452.24603, "r_y1": 453.77547999999996, "r_x2": 452.24603, "r_y2": 445.70572000000004, "r_x3": 163.1111, "r_y3": 445.70572000000004, "coord_origin": "TOPLEFT" }, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 464.73447, "r_x1": 225.56116, "r_y1": 464.73447, "r_x2": 225.56116, "r_y2": 456.6647, "r_x3": 163.1111, "r_y3": 456.6647, "coord_origin": "TOPLEFT" }, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 486.62024, "r_x1": 211.94211, "r_y1": 486.62024, "r_x2": 211.94211, "r_y2": 478.69394, "r_x3": 163.1111, "r_y3": 478.69394, "coord_origin": "TOPLEFT" }, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.55208999999996, "r_y0": 486.82648, "r_x1": 452.24158, "r_y1": 486.82648, "r_x2": 452.24158, "r_y2": 478.75671, "r_x3": 216.55208999999996, "r_y3": 478.75671, "coord_origin": "TOPLEFT" }, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11111, "r_y0": 497.78549, "r_x1": 257.64185, "r_y1": 497.78549, "r_x2": 257.64185, "r_y2": 489.71573, "r_x3": 163.11111, "r_y3": 489.71573, "coord_origin": "TOPLEFT" }, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 532.68808, "r_x1": 141.48872, "r_y1": 532.68808, "r_x2": 141.48872, "r_y2": 522.11969, "r_x3": 134.76512, "r_y3": 522.11969, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93832, "r_y0": 532.68808, "r_x1": 228.93384, "r_y1": 532.68808, "r_x2": 228.93384, "r_y2": 522.11969, "r_x3": 154.93832, "r_y3": 522.11969, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 557.0835099999999, "r_x1": 480.5939, "r_y1": 557.0835099999999, "r_x2": 480.5939, "r_y2": 548.2865400000001, "r_x3": 134.76512, "r_y3": 548.2865400000001, "coord_origin": "TOPLEFT" }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 569.0395100000001, "r_x1": 480.59180000000003, "r_y1": 569.0395100000001, "r_x2": 480.59180000000003, "r_y2": 560.24254, "r_x3": 134.76512, "r_y3": 560.24254, "coord_origin": "TOPLEFT" }, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 580.99451, "r_x1": 480.59283000000005, "r_y1": 580.99451, "r_x2": 480.59283000000005, "r_y2": 572.19754, "r_x3": 134.76512, "r_y3": 572.19754, "coord_origin": "TOPLEFT" }, "text": "valuable information and therefore need to be extracted with high accuracy.", "orig": "valuable information and therefore need to be extracted with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 592.9495099999999, "r_x1": 480.5959500000001, "r_y1": 592.9495099999999, "r_x2": 480.5959500000001, "r_y2": 584.15254, "r_x3": 134.76512, "r_y3": 584.15254, "coord_origin": "TOPLEFT" }, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 604.90451, "r_x1": 480.58688, "r_y1": 604.90451, "r_x2": 480.58688, "r_y2": 596.10754, "r_x3": 134.76512, "r_y3": 596.10754, "coord_origin": "TOPLEFT" }, "text": "ture, making it difficult to recover their correct structure with simple analyt-", "orig": "ture, making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 616.85951, "r_x1": 480.59088, "r_y1": 616.85951, "r_x2": 480.59088, "r_y2": 608.06255, "r_x3": 134.76512, "r_y3": 608.06255, "coord_origin": "TOPLEFT" }, "text": "ical methods. Therefore, accurate table extraction is achieved these days with", "orig": "ical methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 628.81451, "r_x1": 279.32745, "r_y1": 628.81451, "r_x2": 279.32745, "r_y2": 620.01755, "r_x3": 134.76512, "r_y3": 620.01755, "coord_origin": "TOPLEFT" }, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70811, "r_y0": 640.94452, "r_x1": 480.58899, "r_y1": 640.94452, "r_x2": 480.58899, "r_y2": 632.14755, "r_x3": 149.70811, "r_y3": 632.14755, "coord_origin": "TOPLEFT" }, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 652.8995199999999, "r_x1": 480.59583, "r_y1": 652.8995199999999, "r_x2": 480.59583, "r_y2": 644.1025500000001, "r_x3": 134.76512, "r_y3": 644.1025500000001, "coord_origin": "TOPLEFT" }, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 664.85453, "r_x1": 480.59496999999993, "r_y1": 664.85453, "r_x2": 480.59496999999993, "r_y2": 656.05756, "r_x3": 134.76512, "r_y3": 656.05756, "coord_origin": "TOPLEFT" }, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.340218, "r_y0": 555.00003, "r_x1": 36.339787, "r_y1": 555.00003, "r_x2": 36.339787, "r_y2": 209.47997999999995, "r_x3": 18.340218, "r_y3": 209.47997999999995, "coord_origin": "TOPLEFT" }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "orig": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "section_header", "bbox": { "l": 134.765, "t": 115.89910999999995, "r": 480.59735, "b": 146.51409999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.8918349742889404, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 128.58112000000006, "r_x1": 480.59735, "r_y1": 128.58112000000006, "r_x2": 480.59735, "r_y2": 115.89910999999995, "r_x3": 134.765, "r_y3": 115.89910999999995, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 266.67499, "r_y0": 146.51409999999998, "r_x1": 348.68506, "r_y1": 146.51409999999998, "r_x2": 348.68506, "r_y2": 133.83209, "r_x3": 266.67499, "r_y3": 133.83209, "coord_origin": "TOPLEFT" }, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "key_value_region", "bbox": { "l": 139.34305, "t": 169.69159000000002, "r": 476.01270000000005, "b": 236.27752999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.48445820808410645, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.22598, "r_y0": 180.47069999999997, "r_x1": 217.04390999999998, "r_y1": 180.47069999999997, "r_x2": 217.04390999999998, "r_y2": 171.67371000000003, "r_x3": 151.22598, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.04599, "r_y0": 176.27484000000004, "r_x1": 235.18764, "r_y1": 176.27484000000004, "r_x2": 235.18764, "r_y2": 170.08209, "r_x3": 217.04599, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.18598999999998, "r_y0": 176.27484000000004, "r_x1": 241.4129, "r_y1": 176.27484000000004, "r_x2": 241.4129, "r_y2": 169.69159000000002, "r_x3": 235.18598999999998, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41299000000004, "r_y0": 176.27484000000004, "r_x1": 257.29932, "r_y1": 176.27484000000004, "r_x2": 257.29932, "r_y2": 170.08209, "r_x3": 241.41299000000004, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.298, "r_y0": 176.27484000000004, "r_x1": 263.5249, "r_y1": 176.27484000000004, "r_x2": 263.5249, "r_y2": 169.69159000000002, "r_x3": 257.298, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52499, "r_y0": 176.27484000000004, "r_x1": 279.41132, "r_y1": 176.27484000000004, "r_x2": 279.41132, "r_y2": 170.08209, "r_x3": 263.52499, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27484000000004, "r_x1": 285.6369, "r_y1": 176.27484000000004, "r_x2": 285.6369, "r_y2": 169.69159000000002, "r_x3": 279.41, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63602, "r_y0": 180.47069999999997, "r_x1": 392.27664, "r_y1": 180.47069999999997, "r_x2": 392.27664, "r_y2": 171.67371000000003, "r_x3": 285.63602, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.27502, "r_y0": 176.27484000000004, "r_x1": 398.50192, "r_y1": 176.27484000000004, "r_x2": 398.50192, "r_y2": 169.69159000000002, "r_x3": 392.27502, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.50201, "r_y0": 176.27484000000004, "r_x1": 414.38834, "r_y1": 176.27484000000004, "r_x2": 414.38834, "r_y2": 170.08209, "r_x3": 398.50201, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.38702, "r_y0": 176.27484000000004, "r_x1": 420.61392, "r_y1": 176.27484000000004, "r_x2": 420.61392, "r_y2": 169.69159000000002, "r_x3": 414.38702, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61304, "r_y0": 176.27484000000004, "r_x1": 436.49936, "r_y1": 176.27484000000004, "r_x2": 436.49936, "r_y2": 170.08209, "r_x3": 420.61304, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.49805000000003, "r_y0": 176.27484000000004, "r_x1": 442.72495000000004, "r_y1": 176.27484000000004, "r_x2": 442.72495000000004, "r_y2": 169.69159000000002, "r_x3": 436.49805000000003, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.72504, "r_y0": 180.47069999999997, "r_x1": 464.12963999999994, "r_y1": 180.47069999999997, "r_x2": 464.12963999999994, "r_y2": 171.67371000000003, "r_x3": 442.72504, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34305, "r_y0": 192.42571999999996, "r_x1": 224.80720999999997, "r_y1": 192.42571999999996, "r_x2": 224.80720999999997, "r_y2": 183.62872000000004, "r_x3": 139.34305, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.80704000000003, "r_y0": 188.23090000000002, "r_x1": 242.94868, "r_y1": 188.23090000000002, "r_x2": 242.94868, "r_y2": 182.03814999999997, "r_x3": 224.80704000000003, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.94704000000002, "r_y0": 188.23090000000002, "r_x1": 249.17394999999996, "r_y1": 188.23090000000002, "r_x2": 249.17394999999996, "r_y2": 181.64764000000002, "r_x3": 242.94704000000002, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17404000000002, "r_y0": 188.23090000000002, "r_x1": 265.06036, "r_y1": 188.23090000000002, "r_x2": 265.06036, "r_y2": 182.03814999999997, "r_x3": 249.17404000000002, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.05905, "r_y0": 188.23090000000002, "r_x1": 271.28595, "r_y1": 188.23090000000002, "r_x2": 271.28595, "r_y2": 181.64764000000002, "r_x3": 265.05905, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.28506, "r_y0": 188.23090000000002, "r_x1": 287.17139, "r_y1": 188.23090000000002, "r_x2": 287.17139, "r_y2": 182.03814999999997, "r_x3": 271.28506, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17007, "r_y0": 188.23090000000002, "r_x1": 293.39697, "r_y1": 188.23090000000002, "r_x2": 293.39697, "r_y2": 181.64764000000002, "r_x3": 287.17007, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.39706, "r_y0": 192.42571999999996, "r_x1": 404.1597, "r_y1": 192.42571999999996, "r_x2": 404.1597, "r_y2": 183.62872000000004, "r_x3": 293.39706, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.15808, "r_y0": 188.23090000000002, "r_x1": 410.38498, "r_y1": 188.23090000000002, "r_x2": 410.38498, "r_y2": 181.64764000000002, "r_x3": 404.15808, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.38507, "r_y0": 188.23090000000002, "r_x1": 426.27139, "r_y1": 188.23090000000002, "r_x2": 426.27139, "r_y2": 182.03814999999997, "r_x3": 410.38507, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27008, "r_y0": 188.23090000000002, "r_x1": 432.49697999999995, "r_y1": 188.23090000000002, "r_x2": 432.49697999999995, "r_y2": 181.64764000000002, "r_x3": 426.27008, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.49609, "r_y0": 188.23090000000002, "r_x1": 448.3824200000001, "r_y1": 188.23090000000002, "r_x2": 448.3824200000001, "r_y2": 182.03814999999997, "r_x3": 432.49609, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.3811, "r_y0": 188.23090000000002, "r_x1": 454.608, "r_y1": 188.23090000000002, "r_x2": 454.608, "r_y2": 181.64764000000002, "r_x3": 448.3811, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.60808999999995, "r_y0": 192.42571999999996, "r_x1": 476.01270000000005, "r_y1": 192.42571999999996, "r_x2": 476.01270000000005, "r_y2": 183.62872000000004, "r_x3": 454.60808999999995, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52109000000002, "r_y0": 204.38073999999995, "r_x1": 298.6087, "r_y1": 204.38073999999995, "r_x2": 298.6087, "r_y2": 195.58374000000003, "r_x3": 229.52109000000002, "r_y3": 195.58374000000003, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.60608, "r_y0": 200.18591000000004, "r_x1": 316.74771, "r_y1": 200.18591000000004, "r_x2": 316.74771, "r_y2": 193.99316, "r_x3": 298.60608, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74609, "r_y0": 200.18591000000004, "r_x1": 322.97299, "r_y1": 200.18591000000004, "r_x2": 322.97299, "r_y2": 193.60266000000001, "r_x3": 316.74609, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97308, "r_y0": 200.18591000000004, "r_x1": 338.85941, "r_y1": 200.18591000000004, "r_x2": 338.85941, "r_y2": 193.99316, "r_x3": 322.97308, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.85809, "r_y0": 200.18591000000004, "r_x1": 345.08499, "r_y1": 200.18591000000004, "r_x2": 345.08499, "r_y2": 193.60266000000001, "r_x3": 338.85809, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.08508, "r_y0": 200.18591000000004, "r_x1": 360.97141, "r_y1": 200.18591000000004, "r_x2": 360.97141, "r_y2": 193.99316, "r_x3": 345.08508, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97009, "r_y0": 200.18591000000004, "r_x1": 367.19699, "r_y1": 200.18591000000004, "r_x2": 367.19699, "r_y2": 193.60266000000001, "r_x3": 360.97009, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.19611, "r_y0": 200.18591000000004, "r_x1": 385.33774, "r_y1": 200.18591000000004, "r_x2": 385.33774, "r_y2": 193.99316, "r_x3": 367.19611, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1051, "r_y0": 225.27368, "r_x1": 336.25153, "r_y1": 225.27368, "r_x2": 336.25153, "r_y2": 217.20398, "r_x3": 279.1051, "r_y3": 217.20398, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.96609, "r_y0": 236.27752999999996, "r_x1": 392.38983, "r_y1": 236.27752999999996, "r_x2": 392.38983, "r_y2": 228.80853000000002, "r_x3": 222.96609, "r_y3": 228.80853000000002, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 139.34305, "t": 169.69159000000002, "r": 476.01270000000005, "b": 200.18591000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.7918068766593933, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.22598, "r_y0": 180.47069999999997, "r_x1": 217.04390999999998, "r_y1": 180.47069999999997, "r_x2": 217.04390999999998, "r_y2": 171.67371000000003, "r_x3": 151.22598, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.04599, "r_y0": 176.27484000000004, "r_x1": 235.18764, "r_y1": 176.27484000000004, "r_x2": 235.18764, "r_y2": 170.08209, "r_x3": 217.04599, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.18598999999998, "r_y0": 176.27484000000004, "r_x1": 241.4129, "r_y1": 176.27484000000004, "r_x2": 241.4129, "r_y2": 169.69159000000002, "r_x3": 235.18598999999998, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41299000000004, "r_y0": 176.27484000000004, "r_x1": 257.29932, "r_y1": 176.27484000000004, "r_x2": 257.29932, "r_y2": 170.08209, "r_x3": 241.41299000000004, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.298, "r_y0": 176.27484000000004, "r_x1": 263.5249, "r_y1": 176.27484000000004, "r_x2": 263.5249, "r_y2": 169.69159000000002, "r_x3": 257.298, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52499, "r_y0": 176.27484000000004, "r_x1": 279.41132, "r_y1": 176.27484000000004, "r_x2": 279.41132, "r_y2": 170.08209, "r_x3": 263.52499, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27484000000004, "r_x1": 285.6369, "r_y1": 176.27484000000004, "r_x2": 285.6369, "r_y2": 169.69159000000002, "r_x3": 279.41, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63602, "r_y0": 180.47069999999997, "r_x1": 392.27664, "r_y1": 180.47069999999997, "r_x2": 392.27664, "r_y2": 171.67371000000003, "r_x3": 285.63602, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.27502, "r_y0": 176.27484000000004, "r_x1": 398.50192, "r_y1": 176.27484000000004, "r_x2": 398.50192, "r_y2": 169.69159000000002, "r_x3": 392.27502, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.50201, "r_y0": 176.27484000000004, "r_x1": 414.38834, "r_y1": 176.27484000000004, "r_x2": 414.38834, "r_y2": 170.08209, "r_x3": 398.50201, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.38702, "r_y0": 176.27484000000004, "r_x1": 420.61392, "r_y1": 176.27484000000004, "r_x2": 420.61392, "r_y2": 169.69159000000002, "r_x3": 414.38702, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61304, "r_y0": 176.27484000000004, "r_x1": 436.49936, "r_y1": 176.27484000000004, "r_x2": 436.49936, "r_y2": 170.08209, "r_x3": 420.61304, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.49805000000003, "r_y0": 176.27484000000004, "r_x1": 442.72495000000004, "r_y1": 176.27484000000004, "r_x2": 442.72495000000004, "r_y2": 169.69159000000002, "r_x3": 436.49805000000003, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.72504, "r_y0": 180.47069999999997, "r_x1": 464.12963999999994, "r_y1": 180.47069999999997, "r_x2": 464.12963999999994, "r_y2": 171.67371000000003, "r_x3": 442.72504, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34305, "r_y0": 192.42571999999996, "r_x1": 224.80720999999997, "r_y1": 192.42571999999996, "r_x2": 224.80720999999997, "r_y2": 183.62872000000004, "r_x3": 139.34305, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.80704000000003, "r_y0": 188.23090000000002, "r_x1": 242.94868, "r_y1": 188.23090000000002, "r_x2": 242.94868, "r_y2": 182.03814999999997, "r_x3": 224.80704000000003, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.94704000000002, "r_y0": 188.23090000000002, "r_x1": 249.17394999999996, "r_y1": 188.23090000000002, "r_x2": 249.17394999999996, "r_y2": 181.64764000000002, "r_x3": 242.94704000000002, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17404000000002, "r_y0": 188.23090000000002, "r_x1": 265.06036, "r_y1": 188.23090000000002, "r_x2": 265.06036, "r_y2": 182.03814999999997, "r_x3": 249.17404000000002, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.05905, "r_y0": 188.23090000000002, "r_x1": 271.28595, "r_y1": 188.23090000000002, "r_x2": 271.28595, "r_y2": 181.64764000000002, "r_x3": 265.05905, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.28506, "r_y0": 188.23090000000002, "r_x1": 287.17139, "r_y1": 188.23090000000002, "r_x2": 287.17139, "r_y2": 182.03814999999997, "r_x3": 271.28506, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17007, "r_y0": 188.23090000000002, "r_x1": 293.39697, "r_y1": 188.23090000000002, "r_x2": 293.39697, "r_y2": 181.64764000000002, "r_x3": 287.17007, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.39706, "r_y0": 192.42571999999996, "r_x1": 404.1597, "r_y1": 192.42571999999996, "r_x2": 404.1597, "r_y2": 183.62872000000004, "r_x3": 293.39706, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.15808, "r_y0": 188.23090000000002, "r_x1": 410.38498, "r_y1": 188.23090000000002, "r_x2": 410.38498, "r_y2": 181.64764000000002, "r_x3": 404.15808, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.38507, "r_y0": 188.23090000000002, "r_x1": 426.27139, "r_y1": 188.23090000000002, "r_x2": 426.27139, "r_y2": 182.03814999999997, "r_x3": 410.38507, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27008, "r_y0": 188.23090000000002, "r_x1": 432.49697999999995, "r_y1": 188.23090000000002, "r_x2": 432.49697999999995, "r_y2": 181.64764000000002, "r_x3": 426.27008, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.49609, "r_y0": 188.23090000000002, "r_x1": 448.3824200000001, "r_y1": 188.23090000000002, "r_x2": 448.3824200000001, "r_y2": 182.03814999999997, "r_x3": 432.49609, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.3811, "r_y0": 188.23090000000002, "r_x1": 454.608, "r_y1": 188.23090000000002, "r_x2": 454.608, "r_y2": 181.64764000000002, "r_x3": 448.3811, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.60808999999995, "r_y0": 192.42571999999996, "r_x1": 476.01270000000005, "r_y1": 192.42571999999996, "r_x2": 476.01270000000005, "r_y2": 183.62872000000004, "r_x3": 454.60808999999995, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.60608, "r_y0": 200.18591000000004, "r_x1": 316.74771, "r_y1": 200.18591000000004, "r_x2": 316.74771, "r_y2": 193.99316, "r_x3": 298.60608, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74609, "r_y0": 200.18591000000004, "r_x1": 322.97299, "r_y1": 200.18591000000004, "r_x2": 322.97299, "r_y2": 193.60266000000001, "r_x3": 316.74609, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97308, "r_y0": 200.18591000000004, "r_x1": 338.85941, "r_y1": 200.18591000000004, "r_x2": 338.85941, "r_y2": 193.99316, "r_x3": 322.97308, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.85809, "r_y0": 200.18591000000004, "r_x1": 345.08499, "r_y1": 200.18591000000004, "r_x2": 345.08499, "r_y2": 193.60266000000001, "r_x3": 338.85809, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.08508, "r_y0": 200.18591000000004, "r_x1": 360.97141, "r_y1": 200.18591000000004, "r_x2": 360.97141, "r_y2": 193.99316, "r_x3": 345.08508, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97009, "r_y0": 200.18591000000004, "r_x1": 367.19699, "r_y1": 200.18591000000004, "r_x2": 367.19699, "r_y2": 193.60266000000001, "r_x3": 360.97009, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.19611, "r_y0": 200.18591000000004, "r_x1": 385.33774, "r_y1": 200.18591000000004, "r_x2": 385.33774, "r_y2": 193.99316, "r_x3": 367.19611, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 229.52109000000002, "t": 195.58374000000003, "r": 298.6087, "b": 204.38073999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.5015263557434082, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52109000000002, "r_y0": 204.38073999999995, "r_x1": 298.6087, "r_y1": 204.38073999999995, "r_x2": 298.6087, "r_y2": 195.58374000000003, "r_x3": 229.52109000000002, "r_y3": 195.58374000000003, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "text", "bbox": { "l": 279.1051, "t": 217.20398, "r": 336.25153, "b": 225.27368, "coord_origin": "TOPLEFT" }, "confidence": 0.6310867667198181, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1051, "r_y0": 225.27368, "r_x1": 336.25153, "r_y1": 225.27368, "r_x2": 336.25153, "r_y2": 217.20398, "r_x3": 279.1051, "r_y3": 217.20398, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "text", "bbox": { "l": 222.96609, "t": 228.80853000000002, "r": 392.38983, "b": 236.27752999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.6924149990081787, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.96609, "r_y0": 236.27752999999996, "r_x1": 392.38983, "r_y1": 236.27752999999996, "r_x2": 392.38983, "r_y2": 228.80853000000002, "r_x3": 222.96609, "r_y3": 228.80853000000002, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 1, "label": "text", "bbox": { "l": 163.1111, "t": 270.30115, "r": 452.24878000000007, "b": 464.73447, "coord_origin": "TOPLEFT" }, "confidence": 0.9807654023170471, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 278.22748, "r_x1": 206.6358, "r_y1": 278.22748, "r_x2": 206.6358, "r_y2": 270.30115, "r_x3": 163.1111, "r_y3": 270.30115, "coord_origin": "TOPLEFT" }, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.6171, "r_y0": 278.43364999999994, "r_x1": 452.2447199999999, "r_y1": 278.43364999999994, "r_x2": 452.2447199999999, "r_y2": 270.36395000000005, "r_x3": 211.6171, "r_y3": 270.36395000000005, "coord_origin": "TOPLEFT" }, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 289.39267, "r_x1": 452.24246, "r_y1": 289.39267, "r_x2": 452.24246, "r_y2": 281.3229099999999, "r_x3": 163.1111, "r_y3": 281.3229099999999, "coord_origin": "TOPLEFT" }, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 300.35165000000006, "r_x1": 452.24792, "r_y1": 300.35165000000006, "r_x2": 452.24792, "r_y2": 292.28189, "r_x3": 163.1111, "r_y3": 292.28189, "coord_origin": "TOPLEFT" }, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 311.31064, "r_x1": 452.2407799999999, "r_y1": 311.31064, "r_x2": 452.2407799999999, "r_y2": 303.24088, "r_x3": 163.1111, "r_y3": 303.24088, "coord_origin": "TOPLEFT" }, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 322.26865, "r_x1": 452.24609, "r_y1": 322.26865, "r_x2": 452.24609, "r_y2": 314.19888, "r_x3": 163.1111, "r_y3": 314.19888, "coord_origin": "TOPLEFT" }, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 333.22763, "r_x1": 452.24615000000006, "r_y1": 333.22763, "r_x2": 452.24615000000006, "r_y2": 325.15787, "r_x3": 163.1111, "r_y3": 325.15787, "coord_origin": "TOPLEFT" }, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 344.18661, "r_x1": 452.24707, "r_y1": 344.18661, "r_x2": 452.24707, "r_y2": 336.11685, "r_x3": 163.1111, "r_y3": 336.11685, "coord_origin": "TOPLEFT" }, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 355.1456, "r_x1": 452.2459999999999, "r_y1": 355.1456, "r_x2": 452.2459999999999, "r_y2": 347.07584, "r_x3": 163.1111, "r_y3": 347.07584, "coord_origin": "TOPLEFT" }, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 366.10458, "r_x1": 452.2479900000001, "r_y1": 366.10458, "r_x2": 452.2479900000001, "r_y2": 358.03482, "r_x3": 163.1111, "r_y3": 358.03482, "coord_origin": "TOPLEFT" }, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 377.06357, "r_x1": 452.24609, "r_y1": 377.06357, "r_x2": 452.24609, "r_y2": 368.9938, "r_x3": 163.1111, "r_y3": 368.9938, "coord_origin": "TOPLEFT" }, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 388.02255, "r_x1": 452.2417, "r_y1": 388.02255, "r_x2": 452.2417, "r_y2": 379.95279, "r_x3": 163.1111, "r_y3": 379.95279, "coord_origin": "TOPLEFT" }, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 398.98154, "r_x1": 452.2443200000001, "r_y1": 398.98154, "r_x2": 452.2443200000001, "r_y2": 390.91177, "r_x3": 163.1111, "r_y3": 390.91177, "coord_origin": "TOPLEFT" }, "text": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 409.94052, "r_x1": 452.24878000000007, "r_y1": 409.94052, "r_x2": 452.24878000000007, "r_y2": 401.87076, "r_x3": 163.1111, "r_y3": 401.87076, "coord_origin": "TOPLEFT" }, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 420.8995100000001, "r_x1": 452.24063000000007, "r_y1": 420.8995100000001, "r_x2": 452.24063000000007, "r_y2": 412.82974, "r_x3": 163.1111, "r_y3": 412.82974, "coord_origin": "TOPLEFT" }, "text": "accuracy improves significantly, inference time is halved compared to", "orig": "accuracy improves significantly, inference time is halved compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 431.85751000000005, "r_x1": 452.24161, "r_y1": 431.85751000000005, "r_x2": 452.24161, "r_y2": 423.78774999999996, "r_x3": 163.1111, "r_y3": 423.78774999999996, "coord_origin": "TOPLEFT" }, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 442.8165, "r_x1": 452.24429, "r_y1": 442.8165, "r_x2": 452.24429, "r_y2": 434.74673, "r_x3": 163.1111, "r_y3": 434.74673, "coord_origin": "TOPLEFT" }, "text": "tactically correct. This in turn eliminates most post-processing needs.", "orig": "tactically correct. This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 453.77547999999996, "r_x1": 452.24603, "r_y1": 453.77547999999996, "r_x2": 452.24603, "r_y2": 445.70572000000004, "r_x3": 163.1111, "r_y3": 445.70572000000004, "coord_origin": "TOPLEFT" }, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 464.73447, "r_x1": 225.56116, "r_y1": 464.73447, "r_x2": 225.56116, "r_y2": 456.6647, "r_x3": 163.1111, "r_y3": 456.6647, "coord_origin": "TOPLEFT" }, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 163.1111, "t": 478.69394, "r": 452.24158, "b": 497.78549, "coord_origin": "TOPLEFT" }, "confidence": 0.9304055571556091, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 486.62024, "r_x1": 211.94211, "r_y1": 486.62024, "r_x2": 211.94211, "r_y2": 478.69394, "r_x3": 163.1111, "r_y3": 478.69394, "coord_origin": "TOPLEFT" }, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.55208999999996, "r_y0": 486.82648, "r_x1": 452.24158, "r_y1": 486.82648, "r_x2": 452.24158, "r_y2": 478.75671, "r_x3": 216.55208999999996, "r_y3": 478.75671, "coord_origin": "TOPLEFT" }, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11111, "r_y0": 497.78549, "r_x1": 257.64185, "r_y1": 497.78549, "r_x2": 257.64185, "r_y2": 489.71573, "r_x3": 163.11111, "r_y3": 489.71573, "coord_origin": "TOPLEFT" }, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "section_header", "bbox": { "l": 134.76512, "t": 522.11969, "r": 228.93384, "b": 532.68808, "coord_origin": "TOPLEFT" }, "confidence": 0.9392016530036926, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 532.68808, "r_x1": 141.48872, "r_y1": 532.68808, "r_x2": 141.48872, "r_y2": 522.11969, "r_x3": 134.76512, "r_y3": 522.11969, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93832, "r_y0": 532.68808, "r_x1": 228.93384, "r_y1": 532.68808, "r_x2": 228.93384, "r_y2": 522.11969, "r_x3": 154.93832, "r_y3": 522.11969, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.76512, "t": 548.2865400000001, "r": 480.5959500000001, "b": 628.81451, "coord_origin": "TOPLEFT" }, "confidence": 0.9835679531097412, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 557.0835099999999, "r_x1": 480.5939, "r_y1": 557.0835099999999, "r_x2": 480.5939, "r_y2": 548.2865400000001, "r_x3": 134.76512, "r_y3": 548.2865400000001, "coord_origin": "TOPLEFT" }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 569.0395100000001, "r_x1": 480.59180000000003, "r_y1": 569.0395100000001, "r_x2": 480.59180000000003, "r_y2": 560.24254, "r_x3": 134.76512, "r_y3": 560.24254, "coord_origin": "TOPLEFT" }, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 580.99451, "r_x1": 480.59283000000005, "r_y1": 580.99451, "r_x2": 480.59283000000005, "r_y2": 572.19754, "r_x3": 134.76512, "r_y3": 572.19754, "coord_origin": "TOPLEFT" }, "text": "valuable information and therefore need to be extracted with high accuracy.", "orig": "valuable information and therefore need to be extracted with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 592.9495099999999, "r_x1": 480.5959500000001, "r_y1": 592.9495099999999, "r_x2": 480.5959500000001, "r_y2": 584.15254, "r_x3": 134.76512, "r_y3": 584.15254, "coord_origin": "TOPLEFT" }, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 604.90451, "r_x1": 480.58688, "r_y1": 604.90451, "r_x2": 480.58688, "r_y2": 596.10754, "r_x3": 134.76512, "r_y3": 596.10754, "coord_origin": "TOPLEFT" }, "text": "ture, making it difficult to recover their correct structure with simple analyt-", "orig": "ture, making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 616.85951, "r_x1": 480.59088, "r_y1": 616.85951, "r_x2": 480.59088, "r_y2": 608.06255, "r_x3": 134.76512, "r_y3": 608.06255, "coord_origin": "TOPLEFT" }, "text": "ical methods. Therefore, accurate table extraction is achieved these days with", "orig": "ical methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 628.81451, "r_x1": 279.32745, "r_y1": 628.81451, "r_x2": 279.32745, "r_y2": 620.01755, "r_x3": 134.76512, "r_y3": 620.01755, "coord_origin": "TOPLEFT" }, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.76512, "t": 632.14755, "r": 480.59583, "b": 664.85453, "coord_origin": "TOPLEFT" }, "confidence": 0.9696458578109741, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70811, "r_y0": 640.94452, "r_x1": 480.58899, "r_y1": 640.94452, "r_x2": 480.58899, "r_y2": 632.14755, "r_x3": 149.70811, "r_y3": 632.14755, "coord_origin": "TOPLEFT" }, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 652.8995199999999, "r_x1": 480.59583, "r_y1": 652.8995199999999, "r_x2": 480.59583, "r_y2": 644.1025500000001, "r_x3": 134.76512, "r_y3": 644.1025500000001, "coord_origin": "TOPLEFT" }, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 664.85453, "r_x1": 480.59496999999993, "r_y1": 664.85453, "r_x2": 480.59496999999993, "r_y2": 656.05756, "r_x3": 134.76512, "r_y3": 656.05756, "coord_origin": "TOPLEFT" }, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 18.340218, "t": 209.47997999999995, "r": 36.339787, "b": 555.00003, "coord_origin": "TOPLEFT" }, "confidence": 0.8899643421173096, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.340218, "r_y0": 555.00003, "r_x1": 36.339787, "r_y1": 555.00003, "r_x2": 36.339787, "r_y2": 209.47997999999995, "r_x3": 18.340218, "r_y3": 209.47997999999995, "coord_origin": "TOPLEFT" }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "orig": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "section_header", "id": 5, "page_no": 0, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.765, "t": 115.89910999999995, "r": 480.59735, "b": 146.51409999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.8918349742889404, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 128.58112000000006, "r_x1": 480.59735, "r_y1": 128.58112000000006, "r_x2": 480.59735, "r_y2": 115.89910999999995, "r_x3": 134.765, "r_y3": 115.89910999999995, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 266.67499, "r_y0": 146.51409999999998, "r_x1": 348.68506, "r_y1": 146.51409999999998, "r_x2": 348.68506, "r_y2": 133.83209, "r_x3": 266.67499, "r_y3": 133.83209, "coord_origin": "TOPLEFT" }, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "key_value_region", "id": 16, "page_no": 0, "cluster": { "id": 16, "label": "key_value_region", "bbox": { "l": 139.34305, "t": 169.69159000000002, "r": 476.01270000000005, "b": 236.27752999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.48445820808410645, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.22598, "r_y0": 180.47069999999997, "r_x1": 217.04390999999998, "r_y1": 180.47069999999997, "r_x2": 217.04390999999998, "r_y2": 171.67371000000003, "r_x3": 151.22598, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.04599, "r_y0": 176.27484000000004, "r_x1": 235.18764, "r_y1": 176.27484000000004, "r_x2": 235.18764, "r_y2": 170.08209, "r_x3": 217.04599, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.18598999999998, "r_y0": 176.27484000000004, "r_x1": 241.4129, "r_y1": 176.27484000000004, "r_x2": 241.4129, "r_y2": 169.69159000000002, "r_x3": 235.18598999999998, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41299000000004, "r_y0": 176.27484000000004, "r_x1": 257.29932, "r_y1": 176.27484000000004, "r_x2": 257.29932, "r_y2": 170.08209, "r_x3": 241.41299000000004, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.298, "r_y0": 176.27484000000004, "r_x1": 263.5249, "r_y1": 176.27484000000004, "r_x2": 263.5249, "r_y2": 169.69159000000002, "r_x3": 257.298, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52499, "r_y0": 176.27484000000004, "r_x1": 279.41132, "r_y1": 176.27484000000004, "r_x2": 279.41132, "r_y2": 170.08209, "r_x3": 263.52499, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27484000000004, "r_x1": 285.6369, "r_y1": 176.27484000000004, "r_x2": 285.6369, "r_y2": 169.69159000000002, "r_x3": 279.41, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63602, "r_y0": 180.47069999999997, "r_x1": 392.27664, "r_y1": 180.47069999999997, "r_x2": 392.27664, "r_y2": 171.67371000000003, "r_x3": 285.63602, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.27502, "r_y0": 176.27484000000004, "r_x1": 398.50192, "r_y1": 176.27484000000004, "r_x2": 398.50192, "r_y2": 169.69159000000002, "r_x3": 392.27502, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.50201, "r_y0": 176.27484000000004, "r_x1": 414.38834, "r_y1": 176.27484000000004, "r_x2": 414.38834, "r_y2": 170.08209, "r_x3": 398.50201, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.38702, "r_y0": 176.27484000000004, "r_x1": 420.61392, "r_y1": 176.27484000000004, "r_x2": 420.61392, "r_y2": 169.69159000000002, "r_x3": 414.38702, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61304, "r_y0": 176.27484000000004, "r_x1": 436.49936, "r_y1": 176.27484000000004, "r_x2": 436.49936, "r_y2": 170.08209, "r_x3": 420.61304, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.49805000000003, "r_y0": 176.27484000000004, "r_x1": 442.72495000000004, "r_y1": 176.27484000000004, "r_x2": 442.72495000000004, "r_y2": 169.69159000000002, "r_x3": 436.49805000000003, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.72504, "r_y0": 180.47069999999997, "r_x1": 464.12963999999994, "r_y1": 180.47069999999997, "r_x2": 464.12963999999994, "r_y2": 171.67371000000003, "r_x3": 442.72504, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34305, "r_y0": 192.42571999999996, "r_x1": 224.80720999999997, "r_y1": 192.42571999999996, "r_x2": 224.80720999999997, "r_y2": 183.62872000000004, "r_x3": 139.34305, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.80704000000003, "r_y0": 188.23090000000002, "r_x1": 242.94868, "r_y1": 188.23090000000002, "r_x2": 242.94868, "r_y2": 182.03814999999997, "r_x3": 224.80704000000003, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.94704000000002, "r_y0": 188.23090000000002, "r_x1": 249.17394999999996, "r_y1": 188.23090000000002, "r_x2": 249.17394999999996, "r_y2": 181.64764000000002, "r_x3": 242.94704000000002, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17404000000002, "r_y0": 188.23090000000002, "r_x1": 265.06036, "r_y1": 188.23090000000002, "r_x2": 265.06036, "r_y2": 182.03814999999997, "r_x3": 249.17404000000002, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.05905, "r_y0": 188.23090000000002, "r_x1": 271.28595, "r_y1": 188.23090000000002, "r_x2": 271.28595, "r_y2": 181.64764000000002, "r_x3": 265.05905, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.28506, "r_y0": 188.23090000000002, "r_x1": 287.17139, "r_y1": 188.23090000000002, "r_x2": 287.17139, "r_y2": 182.03814999999997, "r_x3": 271.28506, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17007, "r_y0": 188.23090000000002, "r_x1": 293.39697, "r_y1": 188.23090000000002, "r_x2": 293.39697, "r_y2": 181.64764000000002, "r_x3": 287.17007, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.39706, "r_y0": 192.42571999999996, "r_x1": 404.1597, "r_y1": 192.42571999999996, "r_x2": 404.1597, "r_y2": 183.62872000000004, "r_x3": 293.39706, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.15808, "r_y0": 188.23090000000002, "r_x1": 410.38498, "r_y1": 188.23090000000002, "r_x2": 410.38498, "r_y2": 181.64764000000002, "r_x3": 404.15808, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.38507, "r_y0": 188.23090000000002, "r_x1": 426.27139, "r_y1": 188.23090000000002, "r_x2": 426.27139, "r_y2": 182.03814999999997, "r_x3": 410.38507, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27008, "r_y0": 188.23090000000002, "r_x1": 432.49697999999995, "r_y1": 188.23090000000002, "r_x2": 432.49697999999995, "r_y2": 181.64764000000002, "r_x3": 426.27008, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.49609, "r_y0": 188.23090000000002, "r_x1": 448.3824200000001, "r_y1": 188.23090000000002, "r_x2": 448.3824200000001, "r_y2": 182.03814999999997, "r_x3": 432.49609, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.3811, "r_y0": 188.23090000000002, "r_x1": 454.608, "r_y1": 188.23090000000002, "r_x2": 454.608, "r_y2": 181.64764000000002, "r_x3": 448.3811, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.60808999999995, "r_y0": 192.42571999999996, "r_x1": 476.01270000000005, "r_y1": 192.42571999999996, "r_x2": 476.01270000000005, "r_y2": 183.62872000000004, "r_x3": 454.60808999999995, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52109000000002, "r_y0": 204.38073999999995, "r_x1": 298.6087, "r_y1": 204.38073999999995, "r_x2": 298.6087, "r_y2": 195.58374000000003, "r_x3": 229.52109000000002, "r_y3": 195.58374000000003, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.60608, "r_y0": 200.18591000000004, "r_x1": 316.74771, "r_y1": 200.18591000000004, "r_x2": 316.74771, "r_y2": 193.99316, "r_x3": 298.60608, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74609, "r_y0": 200.18591000000004, "r_x1": 322.97299, "r_y1": 200.18591000000004, "r_x2": 322.97299, "r_y2": 193.60266000000001, "r_x3": 316.74609, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97308, "r_y0": 200.18591000000004, "r_x1": 338.85941, "r_y1": 200.18591000000004, "r_x2": 338.85941, "r_y2": 193.99316, "r_x3": 322.97308, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.85809, "r_y0": 200.18591000000004, "r_x1": 345.08499, "r_y1": 200.18591000000004, "r_x2": 345.08499, "r_y2": 193.60266000000001, "r_x3": 338.85809, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.08508, "r_y0": 200.18591000000004, "r_x1": 360.97141, "r_y1": 200.18591000000004, "r_x2": 360.97141, "r_y2": 193.99316, "r_x3": 345.08508, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97009, "r_y0": 200.18591000000004, "r_x1": 367.19699, "r_y1": 200.18591000000004, "r_x2": 367.19699, "r_y2": 193.60266000000001, "r_x3": 360.97009, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.19611, "r_y0": 200.18591000000004, "r_x1": 385.33774, "r_y1": 200.18591000000004, "r_x2": 385.33774, "r_y2": 193.99316, "r_x3": 367.19611, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1051, "r_y0": 225.27368, "r_x1": 336.25153, "r_y1": 225.27368, "r_x2": 336.25153, "r_y2": 217.20398, "r_x3": 279.1051, "r_y3": 217.20398, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.96609, "r_y0": 236.27752999999996, "r_x1": 392.38983, "r_y1": 236.27752999999996, "r_x2": 392.38983, "r_y2": 228.80853000000002, "r_x3": 222.96609, "r_y3": 228.80853000000002, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 139.34305, "t": 169.69159000000002, "r": 476.01270000000005, "b": 200.18591000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.7918068766593933, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.22598, "r_y0": 180.47069999999997, "r_x1": 217.04390999999998, "r_y1": 180.47069999999997, "r_x2": 217.04390999999998, "r_y2": 171.67371000000003, "r_x3": 151.22598, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.04599, "r_y0": 176.27484000000004, "r_x1": 235.18764, "r_y1": 176.27484000000004, "r_x2": 235.18764, "r_y2": 170.08209, "r_x3": 217.04599, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.18598999999998, "r_y0": 176.27484000000004, "r_x1": 241.4129, "r_y1": 176.27484000000004, "r_x2": 241.4129, "r_y2": 169.69159000000002, "r_x3": 235.18598999999998, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41299000000004, "r_y0": 176.27484000000004, "r_x1": 257.29932, "r_y1": 176.27484000000004, "r_x2": 257.29932, "r_y2": 170.08209, "r_x3": 241.41299000000004, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.298, "r_y0": 176.27484000000004, "r_x1": 263.5249, "r_y1": 176.27484000000004, "r_x2": 263.5249, "r_y2": 169.69159000000002, "r_x3": 257.298, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52499, "r_y0": 176.27484000000004, "r_x1": 279.41132, "r_y1": 176.27484000000004, "r_x2": 279.41132, "r_y2": 170.08209, "r_x3": 263.52499, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27484000000004, "r_x1": 285.6369, "r_y1": 176.27484000000004, "r_x2": 285.6369, "r_y2": 169.69159000000002, "r_x3": 279.41, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63602, "r_y0": 180.47069999999997, "r_x1": 392.27664, "r_y1": 180.47069999999997, "r_x2": 392.27664, "r_y2": 171.67371000000003, "r_x3": 285.63602, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.27502, "r_y0": 176.27484000000004, "r_x1": 398.50192, "r_y1": 176.27484000000004, "r_x2": 398.50192, "r_y2": 169.69159000000002, "r_x3": 392.27502, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.50201, "r_y0": 176.27484000000004, "r_x1": 414.38834, "r_y1": 176.27484000000004, "r_x2": 414.38834, "r_y2": 170.08209, "r_x3": 398.50201, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.38702, "r_y0": 176.27484000000004, "r_x1": 420.61392, "r_y1": 176.27484000000004, "r_x2": 420.61392, "r_y2": 169.69159000000002, "r_x3": 414.38702, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61304, "r_y0": 176.27484000000004, "r_x1": 436.49936, "r_y1": 176.27484000000004, "r_x2": 436.49936, "r_y2": 170.08209, "r_x3": 420.61304, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.49805000000003, "r_y0": 176.27484000000004, "r_x1": 442.72495000000004, "r_y1": 176.27484000000004, "r_x2": 442.72495000000004, "r_y2": 169.69159000000002, "r_x3": 436.49805000000003, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.72504, "r_y0": 180.47069999999997, "r_x1": 464.12963999999994, "r_y1": 180.47069999999997, "r_x2": 464.12963999999994, "r_y2": 171.67371000000003, "r_x3": 442.72504, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34305, "r_y0": 192.42571999999996, "r_x1": 224.80720999999997, "r_y1": 192.42571999999996, "r_x2": 224.80720999999997, "r_y2": 183.62872000000004, "r_x3": 139.34305, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.80704000000003, "r_y0": 188.23090000000002, "r_x1": 242.94868, "r_y1": 188.23090000000002, "r_x2": 242.94868, "r_y2": 182.03814999999997, "r_x3": 224.80704000000003, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.94704000000002, "r_y0": 188.23090000000002, "r_x1": 249.17394999999996, "r_y1": 188.23090000000002, "r_x2": 249.17394999999996, "r_y2": 181.64764000000002, "r_x3": 242.94704000000002, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17404000000002, "r_y0": 188.23090000000002, "r_x1": 265.06036, "r_y1": 188.23090000000002, "r_x2": 265.06036, "r_y2": 182.03814999999997, "r_x3": 249.17404000000002, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.05905, "r_y0": 188.23090000000002, "r_x1": 271.28595, "r_y1": 188.23090000000002, "r_x2": 271.28595, "r_y2": 181.64764000000002, "r_x3": 265.05905, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.28506, "r_y0": 188.23090000000002, "r_x1": 287.17139, "r_y1": 188.23090000000002, "r_x2": 287.17139, "r_y2": 182.03814999999997, "r_x3": 271.28506, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17007, "r_y0": 188.23090000000002, "r_x1": 293.39697, "r_y1": 188.23090000000002, "r_x2": 293.39697, "r_y2": 181.64764000000002, "r_x3": 287.17007, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.39706, "r_y0": 192.42571999999996, "r_x1": 404.1597, "r_y1": 192.42571999999996, "r_x2": 404.1597, "r_y2": 183.62872000000004, "r_x3": 293.39706, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.15808, "r_y0": 188.23090000000002, "r_x1": 410.38498, "r_y1": 188.23090000000002, "r_x2": 410.38498, "r_y2": 181.64764000000002, "r_x3": 404.15808, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.38507, "r_y0": 188.23090000000002, "r_x1": 426.27139, "r_y1": 188.23090000000002, "r_x2": 426.27139, "r_y2": 182.03814999999997, "r_x3": 410.38507, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27008, "r_y0": 188.23090000000002, "r_x1": 432.49697999999995, "r_y1": 188.23090000000002, "r_x2": 432.49697999999995, "r_y2": 181.64764000000002, "r_x3": 426.27008, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.49609, "r_y0": 188.23090000000002, "r_x1": 448.3824200000001, "r_y1": 188.23090000000002, "r_x2": 448.3824200000001, "r_y2": 182.03814999999997, "r_x3": 432.49609, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.3811, "r_y0": 188.23090000000002, "r_x1": 454.608, "r_y1": 188.23090000000002, "r_x2": 454.608, "r_y2": 181.64764000000002, "r_x3": 448.3811, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.60808999999995, "r_y0": 192.42571999999996, "r_x1": 476.01270000000005, "r_y1": 192.42571999999996, "r_x2": 476.01270000000005, "r_y2": 183.62872000000004, "r_x3": 454.60808999999995, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.60608, "r_y0": 200.18591000000004, "r_x1": 316.74771, "r_y1": 200.18591000000004, "r_x2": 316.74771, "r_y2": 193.99316, "r_x3": 298.60608, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74609, "r_y0": 200.18591000000004, "r_x1": 322.97299, "r_y1": 200.18591000000004, "r_x2": 322.97299, "r_y2": 193.60266000000001, "r_x3": 316.74609, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97308, "r_y0": 200.18591000000004, "r_x1": 338.85941, "r_y1": 200.18591000000004, "r_x2": 338.85941, "r_y2": 193.99316, "r_x3": 322.97308, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.85809, "r_y0": 200.18591000000004, "r_x1": 345.08499, "r_y1": 200.18591000000004, "r_x2": 345.08499, "r_y2": 193.60266000000001, "r_x3": 338.85809, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.08508, "r_y0": 200.18591000000004, "r_x1": 360.97141, "r_y1": 200.18591000000004, "r_x2": 360.97141, "r_y2": 193.99316, "r_x3": 345.08508, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97009, "r_y0": 200.18591000000004, "r_x1": 367.19699, "r_y1": 200.18591000000004, "r_x2": 367.19699, "r_y2": 193.60266000000001, "r_x3": 360.97009, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.19611, "r_y0": 200.18591000000004, "r_x1": 385.33774, "r_y1": 200.18591000000004, "r_x2": 385.33774, "r_y2": 193.99316, "r_x3": 367.19611, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 229.52109000000002, "t": 195.58374000000003, "r": 298.6087, "b": 204.38073999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.5015263557434082, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52109000000002, "r_y0": 204.38073999999995, "r_x1": 298.6087, "r_y1": 204.38073999999995, "r_x2": 298.6087, "r_y2": 195.58374000000003, "r_x3": 229.52109000000002, "r_y3": 195.58374000000003, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "text", "bbox": { "l": 279.1051, "t": 217.20398, "r": 336.25153, "b": 225.27368, "coord_origin": "TOPLEFT" }, "confidence": 0.6310867667198181, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1051, "r_y0": 225.27368, "r_x1": 336.25153, "r_y1": 225.27368, "r_x2": 336.25153, "r_y2": 217.20398, "r_x3": 279.1051, "r_y3": 217.20398, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "text", "bbox": { "l": 222.96609, "t": 228.80853000000002, "r": 392.38983, "b": 236.27752999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.6924149990081787, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.96609, "r_y0": 236.27752999999996, "r_x1": 392.38983, "r_y1": 236.27752999999996, "r_x2": 392.38983, "r_y2": 228.80853000000002, "r_x3": 222.96609, "r_y3": 228.80853000000002, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null }, { "label": "text", "id": 1, "page_no": 0, "cluster": { "id": 1, "label": "text", "bbox": { "l": 163.1111, "t": 270.30115, "r": 452.24878000000007, "b": 464.73447, "coord_origin": "TOPLEFT" }, "confidence": 0.9807654023170471, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 278.22748, "r_x1": 206.6358, "r_y1": 278.22748, "r_x2": 206.6358, "r_y2": 270.30115, "r_x3": 163.1111, "r_y3": 270.30115, "coord_origin": "TOPLEFT" }, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.6171, "r_y0": 278.43364999999994, "r_x1": 452.2447199999999, "r_y1": 278.43364999999994, "r_x2": 452.2447199999999, "r_y2": 270.36395000000005, "r_x3": 211.6171, "r_y3": 270.36395000000005, "coord_origin": "TOPLEFT" }, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 289.39267, "r_x1": 452.24246, "r_y1": 289.39267, "r_x2": 452.24246, "r_y2": 281.3229099999999, "r_x3": 163.1111, "r_y3": 281.3229099999999, "coord_origin": "TOPLEFT" }, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 300.35165000000006, "r_x1": 452.24792, "r_y1": 300.35165000000006, "r_x2": 452.24792, "r_y2": 292.28189, "r_x3": 163.1111, "r_y3": 292.28189, "coord_origin": "TOPLEFT" }, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 311.31064, "r_x1": 452.2407799999999, "r_y1": 311.31064, "r_x2": 452.2407799999999, "r_y2": 303.24088, "r_x3": 163.1111, "r_y3": 303.24088, "coord_origin": "TOPLEFT" }, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 322.26865, "r_x1": 452.24609, "r_y1": 322.26865, "r_x2": 452.24609, "r_y2": 314.19888, "r_x3": 163.1111, "r_y3": 314.19888, "coord_origin": "TOPLEFT" }, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 333.22763, "r_x1": 452.24615000000006, "r_y1": 333.22763, "r_x2": 452.24615000000006, "r_y2": 325.15787, "r_x3": 163.1111, "r_y3": 325.15787, "coord_origin": "TOPLEFT" }, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 344.18661, "r_x1": 452.24707, "r_y1": 344.18661, "r_x2": 452.24707, "r_y2": 336.11685, "r_x3": 163.1111, "r_y3": 336.11685, "coord_origin": "TOPLEFT" }, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 355.1456, "r_x1": 452.2459999999999, "r_y1": 355.1456, "r_x2": 452.2459999999999, "r_y2": 347.07584, "r_x3": 163.1111, "r_y3": 347.07584, "coord_origin": "TOPLEFT" }, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 366.10458, "r_x1": 452.2479900000001, "r_y1": 366.10458, "r_x2": 452.2479900000001, "r_y2": 358.03482, "r_x3": 163.1111, "r_y3": 358.03482, "coord_origin": "TOPLEFT" }, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 377.06357, "r_x1": 452.24609, "r_y1": 377.06357, "r_x2": 452.24609, "r_y2": 368.9938, "r_x3": 163.1111, "r_y3": 368.9938, "coord_origin": "TOPLEFT" }, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 388.02255, "r_x1": 452.2417, "r_y1": 388.02255, "r_x2": 452.2417, "r_y2": 379.95279, "r_x3": 163.1111, "r_y3": 379.95279, "coord_origin": "TOPLEFT" }, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 398.98154, "r_x1": 452.2443200000001, "r_y1": 398.98154, "r_x2": 452.2443200000001, "r_y2": 390.91177, "r_x3": 163.1111, "r_y3": 390.91177, "coord_origin": "TOPLEFT" }, "text": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 409.94052, "r_x1": 452.24878000000007, "r_y1": 409.94052, "r_x2": 452.24878000000007, "r_y2": 401.87076, "r_x3": 163.1111, "r_y3": 401.87076, "coord_origin": "TOPLEFT" }, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 420.8995100000001, "r_x1": 452.24063000000007, "r_y1": 420.8995100000001, "r_x2": 452.24063000000007, "r_y2": 412.82974, "r_x3": 163.1111, "r_y3": 412.82974, "coord_origin": "TOPLEFT" }, "text": "accuracy improves significantly, inference time is halved compared to", "orig": "accuracy improves significantly, inference time is halved compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 431.85751000000005, "r_x1": 452.24161, "r_y1": 431.85751000000005, "r_x2": 452.24161, "r_y2": 423.78774999999996, "r_x3": 163.1111, "r_y3": 423.78774999999996, "coord_origin": "TOPLEFT" }, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 442.8165, "r_x1": 452.24429, "r_y1": 442.8165, "r_x2": 452.24429, "r_y2": 434.74673, "r_x3": 163.1111, "r_y3": 434.74673, "coord_origin": "TOPLEFT" }, "text": "tactically correct. This in turn eliminates most post-processing needs.", "orig": "tactically correct. This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 453.77547999999996, "r_x1": 452.24603, "r_y1": 453.77547999999996, "r_x2": 452.24603, "r_y2": 445.70572000000004, "r_x3": 163.1111, "r_y3": 445.70572000000004, "coord_origin": "TOPLEFT" }, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 464.73447, "r_x1": 225.56116, "r_y1": 464.73447, "r_x2": 225.56116, "r_y2": 456.6647, "r_x3": 163.1111, "r_y3": 456.6647, "coord_origin": "TOPLEFT" }, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Abstract. Extracting tables from documents is a crucial task in any document conversion pipeline. Recently, transformer-based models have demonstrated that table-structure can be recognized with impressive accuracy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking only the image of a table, such models predict a sequence of tokens (e.g. in HTML, LaTeX) which represent the structure of the table. Since the token representation of the table structure has a significant impact on the accuracy and run-time performance of any Im2Seq model, we investigate in this paper how table-structure representation can be optimised. We propose a new, optimised table-structure language (OTSL) with a minimized vocabulary and specific rules. The benefits of OTSL are that it reduces the number of tokens to 5 (HTML needs 28+) and shortens the sequence length to half of HTML on average. Consequently, model accuracy improves significantly, inference time is halved compared to HTML-based models, and the predicted table structures are always syntactically correct. This in turn eliminates most post-processing needs. Popular table structure data-sets will be published in OTSL format to the community." }, { "label": "text", "id": 4, "page_no": 0, "cluster": { "id": 4, "label": "text", "bbox": { "l": 163.1111, "t": 478.69394, "r": 452.24158, "b": 497.78549, "coord_origin": "TOPLEFT" }, "confidence": 0.9304055571556091, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 486.62024, "r_x1": 211.94211, "r_y1": 486.62024, "r_x2": 211.94211, "r_y2": 478.69394, "r_x3": 163.1111, "r_y3": 478.69394, "coord_origin": "TOPLEFT" }, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.55208999999996, "r_y0": 486.82648, "r_x1": 452.24158, "r_y1": 486.82648, "r_x2": 452.24158, "r_y2": 478.75671, "r_x3": 216.55208999999996, "r_y3": 478.75671, "coord_origin": "TOPLEFT" }, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11111, "r_y0": 497.78549, "r_x1": 257.64185, "r_y1": 497.78549, "r_x2": 257.64185, "r_y2": 489.71573, "r_x3": 163.11111, "r_y3": 489.71573, "coord_origin": "TOPLEFT" }, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Keywords: Table Structure Recognition \u00b7 Data Representation \u00b7 Transformers \u00b7 Optimization." }, { "label": "section_header", "id": 3, "page_no": 0, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.76512, "t": 522.11969, "r": 228.93384, "b": 532.68808, "coord_origin": "TOPLEFT" }, "confidence": 0.9392016530036926, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 532.68808, "r_x1": 141.48872, "r_y1": 532.68808, "r_x2": 141.48872, "r_y2": 522.11969, "r_x3": 134.76512, "r_y3": 522.11969, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93832, "r_y0": 532.68808, "r_x1": 228.93384, "r_y1": 532.68808, "r_x2": 228.93384, "r_y2": 522.11969, "r_x3": 154.93832, "r_y3": 522.11969, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1 Introduction" }, { "label": "text", "id": 0, "page_no": 0, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76512, "t": 548.2865400000001, "r": 480.5959500000001, "b": 628.81451, "coord_origin": "TOPLEFT" }, "confidence": 0.9835679531097412, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 557.0835099999999, "r_x1": 480.5939, "r_y1": 557.0835099999999, "r_x2": 480.5939, "r_y2": 548.2865400000001, "r_x3": 134.76512, "r_y3": 548.2865400000001, "coord_origin": "TOPLEFT" }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 569.0395100000001, "r_x1": 480.59180000000003, "r_y1": 569.0395100000001, "r_x2": 480.59180000000003, "r_y2": 560.24254, "r_x3": 134.76512, "r_y3": 560.24254, "coord_origin": "TOPLEFT" }, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 580.99451, "r_x1": 480.59283000000005, "r_y1": 580.99451, "r_x2": 480.59283000000005, "r_y2": 572.19754, "r_x3": 134.76512, "r_y3": 572.19754, "coord_origin": "TOPLEFT" }, "text": "valuable information and therefore need to be extracted with high accuracy.", "orig": "valuable information and therefore need to be extracted with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 592.9495099999999, "r_x1": 480.5959500000001, "r_y1": 592.9495099999999, "r_x2": 480.5959500000001, "r_y2": 584.15254, "r_x3": 134.76512, "r_y3": 584.15254, "coord_origin": "TOPLEFT" }, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 604.90451, "r_x1": 480.58688, "r_y1": 604.90451, "r_x2": 480.58688, "r_y2": 596.10754, "r_x3": 134.76512, "r_y3": 596.10754, "coord_origin": "TOPLEFT" }, "text": "ture, making it difficult to recover their correct structure with simple analyt-", "orig": "ture, making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 616.85951, "r_x1": 480.59088, "r_y1": 616.85951, "r_x2": 480.59088, "r_y2": 608.06255, "r_x3": 134.76512, "r_y3": 608.06255, "coord_origin": "TOPLEFT" }, "text": "ical methods. Therefore, accurate table extraction is achieved these days with", "orig": "ical methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 628.81451, "r_x1": 279.32745, "r_y1": 628.81451, "r_x2": 279.32745, "r_y2": 620.01755, "r_x3": 134.76512, "r_y3": 620.01755, "coord_origin": "TOPLEFT" }, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports, manuals, specification sheets or marketing material. They often encode highly valuable information and therefore need to be extracted with high accuracy. Unfortunately, tables appear in documents in various sizes, styling and structure, making it difficult to recover their correct structure with simple analytical methods. Therefore, accurate table extraction is achieved these days with machine-learning based methods." }, { "label": "text", "id": 2, "page_no": 0, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76512, "t": 632.14755, "r": 480.59583, "b": 664.85453, "coord_origin": "TOPLEFT" }, "confidence": 0.9696458578109741, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70811, "r_y0": 640.94452, "r_x1": 480.58899, "r_y1": 640.94452, "r_x2": 480.58899, "r_y2": 632.14755, "r_x3": 149.70811, "r_y3": 632.14755, "coord_origin": "TOPLEFT" }, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 652.8995199999999, "r_x1": 480.59583, "r_y1": 652.8995199999999, "r_x2": 480.59583, "r_y2": 644.1025500000001, "r_x3": 134.76512, "r_y3": 644.1025500000001, "coord_origin": "TOPLEFT" }, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 664.85453, "r_x1": 480.59496999999993, "r_y1": 664.85453, "r_x2": 480.59496999999993, "r_y2": 656.05756, "r_x3": 134.76512, "r_y3": 656.05756, "coord_origin": "TOPLEFT" }, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In modern document understanding systems [1,15], table extraction is typically a two-step process. Firstly, every table on a page is located with a bounding box, and secondly, their logical row and column structure is recognized. As of" }, { "label": "page_header", "id": 6, "page_no": 0, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 18.340218, "t": 209.47997999999995, "r": 36.339787, "b": 555.00003, "coord_origin": "TOPLEFT" }, "confidence": 0.8899643421173096, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.340218, "r_y0": 555.00003, "r_x1": 36.339787, "r_y1": 555.00003, "r_x2": 36.339787, "r_y2": 209.47997999999995, "r_x3": 18.340218, "r_y3": 209.47997999999995, "coord_origin": "TOPLEFT" }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "orig": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023" } ], "body": [ { "label": "section_header", "id": 5, "page_no": 0, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.765, "t": 115.89910999999995, "r": 480.59735, "b": 146.51409999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.8918349742889404, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 128.58112000000006, "r_x1": 480.59735, "r_y1": 128.58112000000006, "r_x2": 480.59735, "r_y2": 115.89910999999995, "r_x3": 134.765, "r_y3": 115.89910999999995, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 266.67499, "r_y0": 146.51409999999998, "r_x1": 348.68506, "r_y1": 146.51409999999998, "r_x2": 348.68506, "r_y2": 133.83209, "r_x3": 266.67499, "r_y3": 133.83209, "coord_origin": "TOPLEFT" }, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "key_value_region", "id": 16, "page_no": 0, "cluster": { "id": 16, "label": "key_value_region", "bbox": { "l": 139.34305, "t": 169.69159000000002, "r": 476.01270000000005, "b": 236.27752999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.48445820808410645, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.22598, "r_y0": 180.47069999999997, "r_x1": 217.04390999999998, "r_y1": 180.47069999999997, "r_x2": 217.04390999999998, "r_y2": 171.67371000000003, "r_x3": 151.22598, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.04599, "r_y0": 176.27484000000004, "r_x1": 235.18764, "r_y1": 176.27484000000004, "r_x2": 235.18764, "r_y2": 170.08209, "r_x3": 217.04599, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.18598999999998, "r_y0": 176.27484000000004, "r_x1": 241.4129, "r_y1": 176.27484000000004, "r_x2": 241.4129, "r_y2": 169.69159000000002, "r_x3": 235.18598999999998, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41299000000004, "r_y0": 176.27484000000004, "r_x1": 257.29932, "r_y1": 176.27484000000004, "r_x2": 257.29932, "r_y2": 170.08209, "r_x3": 241.41299000000004, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.298, "r_y0": 176.27484000000004, "r_x1": 263.5249, "r_y1": 176.27484000000004, "r_x2": 263.5249, "r_y2": 169.69159000000002, "r_x3": 257.298, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52499, "r_y0": 176.27484000000004, "r_x1": 279.41132, "r_y1": 176.27484000000004, "r_x2": 279.41132, "r_y2": 170.08209, "r_x3": 263.52499, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27484000000004, "r_x1": 285.6369, "r_y1": 176.27484000000004, "r_x2": 285.6369, "r_y2": 169.69159000000002, "r_x3": 279.41, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63602, "r_y0": 180.47069999999997, "r_x1": 392.27664, "r_y1": 180.47069999999997, "r_x2": 392.27664, "r_y2": 171.67371000000003, "r_x3": 285.63602, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.27502, "r_y0": 176.27484000000004, "r_x1": 398.50192, "r_y1": 176.27484000000004, "r_x2": 398.50192, "r_y2": 169.69159000000002, "r_x3": 392.27502, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.50201, "r_y0": 176.27484000000004, "r_x1": 414.38834, "r_y1": 176.27484000000004, "r_x2": 414.38834, "r_y2": 170.08209, "r_x3": 398.50201, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.38702, "r_y0": 176.27484000000004, "r_x1": 420.61392, "r_y1": 176.27484000000004, "r_x2": 420.61392, "r_y2": 169.69159000000002, "r_x3": 414.38702, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61304, "r_y0": 176.27484000000004, "r_x1": 436.49936, "r_y1": 176.27484000000004, "r_x2": 436.49936, "r_y2": 170.08209, "r_x3": 420.61304, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.49805000000003, "r_y0": 176.27484000000004, "r_x1": 442.72495000000004, "r_y1": 176.27484000000004, "r_x2": 442.72495000000004, "r_y2": 169.69159000000002, "r_x3": 436.49805000000003, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.72504, "r_y0": 180.47069999999997, "r_x1": 464.12963999999994, "r_y1": 180.47069999999997, "r_x2": 464.12963999999994, "r_y2": 171.67371000000003, "r_x3": 442.72504, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34305, "r_y0": 192.42571999999996, "r_x1": 224.80720999999997, "r_y1": 192.42571999999996, "r_x2": 224.80720999999997, "r_y2": 183.62872000000004, "r_x3": 139.34305, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.80704000000003, "r_y0": 188.23090000000002, "r_x1": 242.94868, "r_y1": 188.23090000000002, "r_x2": 242.94868, "r_y2": 182.03814999999997, "r_x3": 224.80704000000003, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.94704000000002, "r_y0": 188.23090000000002, "r_x1": 249.17394999999996, "r_y1": 188.23090000000002, "r_x2": 249.17394999999996, "r_y2": 181.64764000000002, "r_x3": 242.94704000000002, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17404000000002, "r_y0": 188.23090000000002, "r_x1": 265.06036, "r_y1": 188.23090000000002, "r_x2": 265.06036, "r_y2": 182.03814999999997, "r_x3": 249.17404000000002, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.05905, "r_y0": 188.23090000000002, "r_x1": 271.28595, "r_y1": 188.23090000000002, "r_x2": 271.28595, "r_y2": 181.64764000000002, "r_x3": 265.05905, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.28506, "r_y0": 188.23090000000002, "r_x1": 287.17139, "r_y1": 188.23090000000002, "r_x2": 287.17139, "r_y2": 182.03814999999997, "r_x3": 271.28506, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17007, "r_y0": 188.23090000000002, "r_x1": 293.39697, "r_y1": 188.23090000000002, "r_x2": 293.39697, "r_y2": 181.64764000000002, "r_x3": 287.17007, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.39706, "r_y0": 192.42571999999996, "r_x1": 404.1597, "r_y1": 192.42571999999996, "r_x2": 404.1597, "r_y2": 183.62872000000004, "r_x3": 293.39706, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.15808, "r_y0": 188.23090000000002, "r_x1": 410.38498, "r_y1": 188.23090000000002, "r_x2": 410.38498, "r_y2": 181.64764000000002, "r_x3": 404.15808, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.38507, "r_y0": 188.23090000000002, "r_x1": 426.27139, "r_y1": 188.23090000000002, "r_x2": 426.27139, "r_y2": 182.03814999999997, "r_x3": 410.38507, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27008, "r_y0": 188.23090000000002, "r_x1": 432.49697999999995, "r_y1": 188.23090000000002, "r_x2": 432.49697999999995, "r_y2": 181.64764000000002, "r_x3": 426.27008, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.49609, "r_y0": 188.23090000000002, "r_x1": 448.3824200000001, "r_y1": 188.23090000000002, "r_x2": 448.3824200000001, "r_y2": 182.03814999999997, "r_x3": 432.49609, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.3811, "r_y0": 188.23090000000002, "r_x1": 454.608, "r_y1": 188.23090000000002, "r_x2": 454.608, "r_y2": 181.64764000000002, "r_x3": 448.3811, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.60808999999995, "r_y0": 192.42571999999996, "r_x1": 476.01270000000005, "r_y1": 192.42571999999996, "r_x2": 476.01270000000005, "r_y2": 183.62872000000004, "r_x3": 454.60808999999995, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52109000000002, "r_y0": 204.38073999999995, "r_x1": 298.6087, "r_y1": 204.38073999999995, "r_x2": 298.6087, "r_y2": 195.58374000000003, "r_x3": 229.52109000000002, "r_y3": 195.58374000000003, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.60608, "r_y0": 200.18591000000004, "r_x1": 316.74771, "r_y1": 200.18591000000004, "r_x2": 316.74771, "r_y2": 193.99316, "r_x3": 298.60608, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74609, "r_y0": 200.18591000000004, "r_x1": 322.97299, "r_y1": 200.18591000000004, "r_x2": 322.97299, "r_y2": 193.60266000000001, "r_x3": 316.74609, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97308, "r_y0": 200.18591000000004, "r_x1": 338.85941, "r_y1": 200.18591000000004, "r_x2": 338.85941, "r_y2": 193.99316, "r_x3": 322.97308, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.85809, "r_y0": 200.18591000000004, "r_x1": 345.08499, "r_y1": 200.18591000000004, "r_x2": 345.08499, "r_y2": 193.60266000000001, "r_x3": 338.85809, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.08508, "r_y0": 200.18591000000004, "r_x1": 360.97141, "r_y1": 200.18591000000004, "r_x2": 360.97141, "r_y2": 193.99316, "r_x3": 345.08508, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97009, "r_y0": 200.18591000000004, "r_x1": 367.19699, "r_y1": 200.18591000000004, "r_x2": 367.19699, "r_y2": 193.60266000000001, "r_x3": 360.97009, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.19611, "r_y0": 200.18591000000004, "r_x1": 385.33774, "r_y1": 200.18591000000004, "r_x2": 385.33774, "r_y2": 193.99316, "r_x3": 367.19611, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1051, "r_y0": 225.27368, "r_x1": 336.25153, "r_y1": 225.27368, "r_x2": 336.25153, "r_y2": 217.20398, "r_x3": 279.1051, "r_y3": 217.20398, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.96609, "r_y0": 236.27752999999996, "r_x1": 392.38983, "r_y1": 236.27752999999996, "r_x2": 392.38983, "r_y2": 228.80853000000002, "r_x3": 222.96609, "r_y3": 228.80853000000002, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 139.34305, "t": 169.69159000000002, "r": 476.01270000000005, "b": 200.18591000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.7918068766593933, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.22598, "r_y0": 180.47069999999997, "r_x1": 217.04390999999998, "r_y1": 180.47069999999997, "r_x2": 217.04390999999998, "r_y2": 171.67371000000003, "r_x3": 151.22598, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.04599, "r_y0": 176.27484000000004, "r_x1": 235.18764, "r_y1": 176.27484000000004, "r_x2": 235.18764, "r_y2": 170.08209, "r_x3": 217.04599, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.18598999999998, "r_y0": 176.27484000000004, "r_x1": 241.4129, "r_y1": 176.27484000000004, "r_x2": 241.4129, "r_y2": 169.69159000000002, "r_x3": 235.18598999999998, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41299000000004, "r_y0": 176.27484000000004, "r_x1": 257.29932, "r_y1": 176.27484000000004, "r_x2": 257.29932, "r_y2": 170.08209, "r_x3": 241.41299000000004, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.298, "r_y0": 176.27484000000004, "r_x1": 263.5249, "r_y1": 176.27484000000004, "r_x2": 263.5249, "r_y2": 169.69159000000002, "r_x3": 257.298, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52499, "r_y0": 176.27484000000004, "r_x1": 279.41132, "r_y1": 176.27484000000004, "r_x2": 279.41132, "r_y2": 170.08209, "r_x3": 263.52499, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27484000000004, "r_x1": 285.6369, "r_y1": 176.27484000000004, "r_x2": 285.6369, "r_y2": 169.69159000000002, "r_x3": 279.41, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.63602, "r_y0": 180.47069999999997, "r_x1": 392.27664, "r_y1": 180.47069999999997, "r_x2": 392.27664, "r_y2": 171.67371000000003, "r_x3": 285.63602, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.27502, "r_y0": 176.27484000000004, "r_x1": 398.50192, "r_y1": 176.27484000000004, "r_x2": 398.50192, "r_y2": 169.69159000000002, "r_x3": 392.27502, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.50201, "r_y0": 176.27484000000004, "r_x1": 414.38834, "r_y1": 176.27484000000004, "r_x2": 414.38834, "r_y2": 170.08209, "r_x3": 398.50201, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.38702, "r_y0": 176.27484000000004, "r_x1": 420.61392, "r_y1": 176.27484000000004, "r_x2": 420.61392, "r_y2": 169.69159000000002, "r_x3": 414.38702, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61304, "r_y0": 176.27484000000004, "r_x1": 436.49936, "r_y1": 176.27484000000004, "r_x2": 436.49936, "r_y2": 170.08209, "r_x3": 420.61304, "r_y3": 170.08209, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.49805000000003, "r_y0": 176.27484000000004, "r_x1": 442.72495000000004, "r_y1": 176.27484000000004, "r_x2": 442.72495000000004, "r_y2": 169.69159000000002, "r_x3": 436.49805000000003, "r_y3": 169.69159000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.72504, "r_y0": 180.47069999999997, "r_x1": 464.12963999999994, "r_y1": 180.47069999999997, "r_x2": 464.12963999999994, "r_y2": 171.67371000000003, "r_x3": 442.72504, "r_y3": 171.67371000000003, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34305, "r_y0": 192.42571999999996, "r_x1": 224.80720999999997, "r_y1": 192.42571999999996, "r_x2": 224.80720999999997, "r_y2": 183.62872000000004, "r_x3": 139.34305, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.80704000000003, "r_y0": 188.23090000000002, "r_x1": 242.94868, "r_y1": 188.23090000000002, "r_x2": 242.94868, "r_y2": 182.03814999999997, "r_x3": 224.80704000000003, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.94704000000002, "r_y0": 188.23090000000002, "r_x1": 249.17394999999996, "r_y1": 188.23090000000002, "r_x2": 249.17394999999996, "r_y2": 181.64764000000002, "r_x3": 242.94704000000002, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17404000000002, "r_y0": 188.23090000000002, "r_x1": 265.06036, "r_y1": 188.23090000000002, "r_x2": 265.06036, "r_y2": 182.03814999999997, "r_x3": 249.17404000000002, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.05905, "r_y0": 188.23090000000002, "r_x1": 271.28595, "r_y1": 188.23090000000002, "r_x2": 271.28595, "r_y2": 181.64764000000002, "r_x3": 265.05905, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.28506, "r_y0": 188.23090000000002, "r_x1": 287.17139, "r_y1": 188.23090000000002, "r_x2": 287.17139, "r_y2": 182.03814999999997, "r_x3": 271.28506, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17007, "r_y0": 188.23090000000002, "r_x1": 293.39697, "r_y1": 188.23090000000002, "r_x2": 293.39697, "r_y2": 181.64764000000002, "r_x3": 287.17007, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.39706, "r_y0": 192.42571999999996, "r_x1": 404.1597, "r_y1": 192.42571999999996, "r_x2": 404.1597, "r_y2": 183.62872000000004, "r_x3": 293.39706, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.15808, "r_y0": 188.23090000000002, "r_x1": 410.38498, "r_y1": 188.23090000000002, "r_x2": 410.38498, "r_y2": 181.64764000000002, "r_x3": 404.15808, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.38507, "r_y0": 188.23090000000002, "r_x1": 426.27139, "r_y1": 188.23090000000002, "r_x2": 426.27139, "r_y2": 182.03814999999997, "r_x3": 410.38507, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27008, "r_y0": 188.23090000000002, "r_x1": 432.49697999999995, "r_y1": 188.23090000000002, "r_x2": 432.49697999999995, "r_y2": 181.64764000000002, "r_x3": 426.27008, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.49609, "r_y0": 188.23090000000002, "r_x1": 448.3824200000001, "r_y1": 188.23090000000002, "r_x2": 448.3824200000001, "r_y2": 182.03814999999997, "r_x3": 432.49609, "r_y3": 182.03814999999997, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.3811, "r_y0": 188.23090000000002, "r_x1": 454.608, "r_y1": 188.23090000000002, "r_x2": 454.608, "r_y2": 181.64764000000002, "r_x3": 448.3811, "r_y3": 181.64764000000002, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.60808999999995, "r_y0": 192.42571999999996, "r_x1": 476.01270000000005, "r_y1": 192.42571999999996, "r_x2": 476.01270000000005, "r_y2": 183.62872000000004, "r_x3": 454.60808999999995, "r_y3": 183.62872000000004, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.60608, "r_y0": 200.18591000000004, "r_x1": 316.74771, "r_y1": 200.18591000000004, "r_x2": 316.74771, "r_y2": 193.99316, "r_x3": 298.60608, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74609, "r_y0": 200.18591000000004, "r_x1": 322.97299, "r_y1": 200.18591000000004, "r_x2": 322.97299, "r_y2": 193.60266000000001, "r_x3": 316.74609, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97308, "r_y0": 200.18591000000004, "r_x1": 338.85941, "r_y1": 200.18591000000004, "r_x2": 338.85941, "r_y2": 193.99316, "r_x3": 322.97308, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.85809, "r_y0": 200.18591000000004, "r_x1": 345.08499, "r_y1": 200.18591000000004, "r_x2": 345.08499, "r_y2": 193.60266000000001, "r_x3": 338.85809, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.08508, "r_y0": 200.18591000000004, "r_x1": 360.97141, "r_y1": 200.18591000000004, "r_x2": 360.97141, "r_y2": 193.99316, "r_x3": 345.08508, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97009, "r_y0": 200.18591000000004, "r_x1": 367.19699, "r_y1": 200.18591000000004, "r_x2": 367.19699, "r_y2": 193.60266000000001, "r_x3": 360.97009, "r_y3": 193.60266000000001, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.19611, "r_y0": 200.18591000000004, "r_x1": 385.33774, "r_y1": 200.18591000000004, "r_x2": 385.33774, "r_y2": 193.99316, "r_x3": 367.19611, "r_y3": 193.99316, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 229.52109000000002, "t": 195.58374000000003, "r": 298.6087, "b": 204.38073999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.5015263557434082, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52109000000002, "r_y0": 204.38073999999995, "r_x1": 298.6087, "r_y1": 204.38073999999995, "r_x2": 298.6087, "r_y2": 195.58374000000003, "r_x3": 229.52109000000002, "r_y3": 195.58374000000003, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "text", "bbox": { "l": 279.1051, "t": 217.20398, "r": 336.25153, "b": 225.27368, "coord_origin": "TOPLEFT" }, "confidence": 0.6310867667198181, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1051, "r_y0": 225.27368, "r_x1": 336.25153, "r_y1": 225.27368, "r_x2": 336.25153, "r_y2": 217.20398, "r_x3": 279.1051, "r_y3": 217.20398, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "text", "bbox": { "l": 222.96609, "t": 228.80853000000002, "r": 392.38983, "b": 236.27752999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.6924149990081787, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.96609, "r_y0": 236.27752999999996, "r_x1": 392.38983, "r_y1": 236.27752999999996, "r_x2": 392.38983, "r_y2": 228.80853000000002, "r_x3": 222.96609, "r_y3": 228.80853000000002, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null }, { "label": "text", "id": 1, "page_no": 0, "cluster": { "id": 1, "label": "text", "bbox": { "l": 163.1111, "t": 270.30115, "r": 452.24878000000007, "b": 464.73447, "coord_origin": "TOPLEFT" }, "confidence": 0.9807654023170471, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 278.22748, "r_x1": 206.6358, "r_y1": 278.22748, "r_x2": 206.6358, "r_y2": 270.30115, "r_x3": 163.1111, "r_y3": 270.30115, "coord_origin": "TOPLEFT" }, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.6171, "r_y0": 278.43364999999994, "r_x1": 452.2447199999999, "r_y1": 278.43364999999994, "r_x2": 452.2447199999999, "r_y2": 270.36395000000005, "r_x3": 211.6171, "r_y3": 270.36395000000005, "coord_origin": "TOPLEFT" }, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 289.39267, "r_x1": 452.24246, "r_y1": 289.39267, "r_x2": 452.24246, "r_y2": 281.3229099999999, "r_x3": 163.1111, "r_y3": 281.3229099999999, "coord_origin": "TOPLEFT" }, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 300.35165000000006, "r_x1": 452.24792, "r_y1": 300.35165000000006, "r_x2": 452.24792, "r_y2": 292.28189, "r_x3": 163.1111, "r_y3": 292.28189, "coord_origin": "TOPLEFT" }, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 311.31064, "r_x1": 452.2407799999999, "r_y1": 311.31064, "r_x2": 452.2407799999999, "r_y2": 303.24088, "r_x3": 163.1111, "r_y3": 303.24088, "coord_origin": "TOPLEFT" }, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 322.26865, "r_x1": 452.24609, "r_y1": 322.26865, "r_x2": 452.24609, "r_y2": 314.19888, "r_x3": 163.1111, "r_y3": 314.19888, "coord_origin": "TOPLEFT" }, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 333.22763, "r_x1": 452.24615000000006, "r_y1": 333.22763, "r_x2": 452.24615000000006, "r_y2": 325.15787, "r_x3": 163.1111, "r_y3": 325.15787, "coord_origin": "TOPLEFT" }, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 344.18661, "r_x1": 452.24707, "r_y1": 344.18661, "r_x2": 452.24707, "r_y2": 336.11685, "r_x3": 163.1111, "r_y3": 336.11685, "coord_origin": "TOPLEFT" }, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 355.1456, "r_x1": 452.2459999999999, "r_y1": 355.1456, "r_x2": 452.2459999999999, "r_y2": 347.07584, "r_x3": 163.1111, "r_y3": 347.07584, "coord_origin": "TOPLEFT" }, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 366.10458, "r_x1": 452.2479900000001, "r_y1": 366.10458, "r_x2": 452.2479900000001, "r_y2": 358.03482, "r_x3": 163.1111, "r_y3": 358.03482, "coord_origin": "TOPLEFT" }, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 377.06357, "r_x1": 452.24609, "r_y1": 377.06357, "r_x2": 452.24609, "r_y2": 368.9938, "r_x3": 163.1111, "r_y3": 368.9938, "coord_origin": "TOPLEFT" }, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 388.02255, "r_x1": 452.2417, "r_y1": 388.02255, "r_x2": 452.2417, "r_y2": 379.95279, "r_x3": 163.1111, "r_y3": 379.95279, "coord_origin": "TOPLEFT" }, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 398.98154, "r_x1": 452.2443200000001, "r_y1": 398.98154, "r_x2": 452.2443200000001, "r_y2": 390.91177, "r_x3": 163.1111, "r_y3": 390.91177, "coord_origin": "TOPLEFT" }, "text": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 409.94052, "r_x1": 452.24878000000007, "r_y1": 409.94052, "r_x2": 452.24878000000007, "r_y2": 401.87076, "r_x3": 163.1111, "r_y3": 401.87076, "coord_origin": "TOPLEFT" }, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 420.8995100000001, "r_x1": 452.24063000000007, "r_y1": 420.8995100000001, "r_x2": 452.24063000000007, "r_y2": 412.82974, "r_x3": 163.1111, "r_y3": 412.82974, "coord_origin": "TOPLEFT" }, "text": "accuracy improves significantly, inference time is halved compared to", "orig": "accuracy improves significantly, inference time is halved compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 431.85751000000005, "r_x1": 452.24161, "r_y1": 431.85751000000005, "r_x2": 452.24161, "r_y2": 423.78774999999996, "r_x3": 163.1111, "r_y3": 423.78774999999996, "coord_origin": "TOPLEFT" }, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 442.8165, "r_x1": 452.24429, "r_y1": 442.8165, "r_x2": 452.24429, "r_y2": 434.74673, "r_x3": 163.1111, "r_y3": 434.74673, "coord_origin": "TOPLEFT" }, "text": "tactically correct. This in turn eliminates most post-processing needs.", "orig": "tactically correct. This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 453.77547999999996, "r_x1": 452.24603, "r_y1": 453.77547999999996, "r_x2": 452.24603, "r_y2": 445.70572000000004, "r_x3": 163.1111, "r_y3": 445.70572000000004, "coord_origin": "TOPLEFT" }, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 464.73447, "r_x1": 225.56116, "r_y1": 464.73447, "r_x2": 225.56116, "r_y2": 456.6647, "r_x3": 163.1111, "r_y3": 456.6647, "coord_origin": "TOPLEFT" }, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Abstract. Extracting tables from documents is a crucial task in any document conversion pipeline. Recently, transformer-based models have demonstrated that table-structure can be recognized with impressive accuracy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking only the image of a table, such models predict a sequence of tokens (e.g. in HTML, LaTeX) which represent the structure of the table. Since the token representation of the table structure has a significant impact on the accuracy and run-time performance of any Im2Seq model, we investigate in this paper how table-structure representation can be optimised. We propose a new, optimised table-structure language (OTSL) with a minimized vocabulary and specific rules. The benefits of OTSL are that it reduces the number of tokens to 5 (HTML needs 28+) and shortens the sequence length to half of HTML on average. Consequently, model accuracy improves significantly, inference time is halved compared to HTML-based models, and the predicted table structures are always syntactically correct. This in turn eliminates most post-processing needs. Popular table structure data-sets will be published in OTSL format to the community." }, { "label": "text", "id": 4, "page_no": 0, "cluster": { "id": 4, "label": "text", "bbox": { "l": 163.1111, "t": 478.69394, "r": 452.24158, "b": 497.78549, "coord_origin": "TOPLEFT" }, "confidence": 0.9304055571556091, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1111, "r_y0": 486.62024, "r_x1": 211.94211, "r_y1": 486.62024, "r_x2": 211.94211, "r_y2": 478.69394, "r_x3": 163.1111, "r_y3": 478.69394, "coord_origin": "TOPLEFT" }, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.55208999999996, "r_y0": 486.82648, "r_x1": 452.24158, "r_y1": 486.82648, "r_x2": 452.24158, "r_y2": 478.75671, "r_x3": 216.55208999999996, "r_y3": 478.75671, "coord_origin": "TOPLEFT" }, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11111, "r_y0": 497.78549, "r_x1": 257.64185, "r_y1": 497.78549, "r_x2": 257.64185, "r_y2": 489.71573, "r_x3": 163.11111, "r_y3": 489.71573, "coord_origin": "TOPLEFT" }, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Keywords: Table Structure Recognition \u00b7 Data Representation \u00b7 Transformers \u00b7 Optimization." }, { "label": "section_header", "id": 3, "page_no": 0, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.76512, "t": 522.11969, "r": 228.93384, "b": 532.68808, "coord_origin": "TOPLEFT" }, "confidence": 0.9392016530036926, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 532.68808, "r_x1": 141.48872, "r_y1": 532.68808, "r_x2": 141.48872, "r_y2": 522.11969, "r_x3": 134.76512, "r_y3": 522.11969, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93832, "r_y0": 532.68808, "r_x1": 228.93384, "r_y1": 532.68808, "r_x2": 228.93384, "r_y2": 522.11969, "r_x3": 154.93832, "r_y3": 522.11969, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1 Introduction" }, { "label": "text", "id": 0, "page_no": 0, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76512, "t": 548.2865400000001, "r": 480.5959500000001, "b": 628.81451, "coord_origin": "TOPLEFT" }, "confidence": 0.9835679531097412, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 557.0835099999999, "r_x1": 480.5939, "r_y1": 557.0835099999999, "r_x2": 480.5939, "r_y2": 548.2865400000001, "r_x3": 134.76512, "r_y3": 548.2865400000001, "coord_origin": "TOPLEFT" }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 569.0395100000001, "r_x1": 480.59180000000003, "r_y1": 569.0395100000001, "r_x2": 480.59180000000003, "r_y2": 560.24254, "r_x3": 134.76512, "r_y3": 560.24254, "coord_origin": "TOPLEFT" }, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 580.99451, "r_x1": 480.59283000000005, "r_y1": 580.99451, "r_x2": 480.59283000000005, "r_y2": 572.19754, "r_x3": 134.76512, "r_y3": 572.19754, "coord_origin": "TOPLEFT" }, "text": "valuable information and therefore need to be extracted with high accuracy.", "orig": "valuable information and therefore need to be extracted with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 592.9495099999999, "r_x1": 480.5959500000001, "r_y1": 592.9495099999999, "r_x2": 480.5959500000001, "r_y2": 584.15254, "r_x3": 134.76512, "r_y3": 584.15254, "coord_origin": "TOPLEFT" }, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 604.90451, "r_x1": 480.58688, "r_y1": 604.90451, "r_x2": 480.58688, "r_y2": 596.10754, "r_x3": 134.76512, "r_y3": 596.10754, "coord_origin": "TOPLEFT" }, "text": "ture, making it difficult to recover their correct structure with simple analyt-", "orig": "ture, making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 616.85951, "r_x1": 480.59088, "r_y1": 616.85951, "r_x2": 480.59088, "r_y2": 608.06255, "r_x3": 134.76512, "r_y3": 608.06255, "coord_origin": "TOPLEFT" }, "text": "ical methods. Therefore, accurate table extraction is achieved these days with", "orig": "ical methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 628.81451, "r_x1": 279.32745, "r_y1": 628.81451, "r_x2": 279.32745, "r_y2": 620.01755, "r_x3": 134.76512, "r_y3": 620.01755, "coord_origin": "TOPLEFT" }, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports, manuals, specification sheets or marketing material. They often encode highly valuable information and therefore need to be extracted with high accuracy. Unfortunately, tables appear in documents in various sizes, styling and structure, making it difficult to recover their correct structure with simple analytical methods. Therefore, accurate table extraction is achieved these days with machine-learning based methods." }, { "label": "text", "id": 2, "page_no": 0, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76512, "t": 632.14755, "r": 480.59583, "b": 664.85453, "coord_origin": "TOPLEFT" }, "confidence": 0.9696458578109741, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70811, "r_y0": 640.94452, "r_x1": 480.58899, "r_y1": 640.94452, "r_x2": 480.58899, "r_y2": 632.14755, "r_x3": 149.70811, "r_y3": 632.14755, "coord_origin": "TOPLEFT" }, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 652.8995199999999, "r_x1": 480.59583, "r_y1": 652.8995199999999, "r_x2": 480.59583, "r_y2": 644.1025500000001, "r_x3": 134.76512, "r_y3": 644.1025500000001, "coord_origin": "TOPLEFT" }, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76512, "r_y0": 664.85453, "r_x1": 480.59496999999993, "r_y1": 664.85453, "r_x2": 480.59496999999993, "r_y2": 656.05756, "r_x3": 134.76512, "r_y3": 656.05756, "coord_origin": "TOPLEFT" }, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In modern document understanding systems [1,15], table extraction is typically a two-step process. Firstly, every table on a page is located with a bounding box, and secondly, their logical row and column structure is recognized. As of" } ], "headers": [ { "label": "page_header", "id": 6, "page_no": 0, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 18.340218, "t": 209.47997999999995, "r": 36.339787, "b": 555.00003, "coord_origin": "TOPLEFT" }, "confidence": 0.8899643421173096, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.340218, "r_y0": 555.00003, "r_x1": 36.339787, "r_y1": 555.00003, "r_x2": 36.339787, "r_y2": 209.47997999999995, "r_x3": 18.340218, "r_y3": 209.47997999999995, "coord_origin": "TOPLEFT" }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "orig": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023" } ] } }, { "page_no": 1, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 134.26049999999998, "r_x1": 162.64424, "r_y1": 134.26049999999998, "r_x2": 162.64424, "r_y2": 126.33416999999997, "r_x3": 134.765, "r_y3": 126.33416999999997, "coord_origin": "TOPLEFT" }, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.062, "r_y0": 134.46667000000002, "r_x1": 480.59106, "r_y1": 134.46667000000002, "r_x2": 480.59106, "r_y2": 126.39697000000001, "r_x3": 167.062, "r_y3": 126.39697000000001, "coord_origin": "TOPLEFT" }, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 145.42566, "r_x1": 480.59018, "r_y1": 145.42566, "r_x2": 480.59018, "r_y2": 137.35595999999998, "r_x3": 134.765, "r_y3": 137.35595999999998, "coord_origin": "TOPLEFT" }, "text": "table-example with complex row and column headers, including a 2D empty span,", "orig": "table-example with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 156.38464, "r_x1": 147.95433, "r_y1": 156.38464, "r_x2": 147.95433, "r_y2": 148.31493999999998, "r_x3": 134.765, "r_y3": 148.31493999999998, "coord_origin": "TOPLEFT" }, "text": "(B)", "orig": "(B)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.39224, "r_y0": 156.38464, "r_x1": 480.59096999999997, "r_y1": 156.38464, "r_x2": 480.59096999999997, "r_y2": 148.31493999999998, "r_x3": 152.39224, "r_y3": 148.31493999999998, "coord_origin": "TOPLEFT" }, "text": "minimal graphical representation of table structure using rectangular layout, (C)", "orig": "minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 167.34362999999996, "r_x1": 480.59189, "r_y1": 167.34362999999996, "r_x2": 480.59189, "r_y2": 159.27392999999995, "r_x3": 134.765, "r_y3": 159.27392999999995, "coord_origin": "TOPLEFT" }, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 178.30260999999996, "r_x1": 480.58914000000004, "r_y1": 178.30260999999996, "r_x2": 480.58914000000004, "r_y2": 170.23290999999995, "r_x3": 134.765, "r_y3": 170.23290999999995, "coord_origin": "TOPLEFT" }, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 189.26160000000004, "r_x1": 480.59020999999996, "r_y1": 189.26160000000004, "r_x2": 480.59020999999996, "r_y2": 181.19188999999994, "r_x3": 134.765, "r_y3": 181.19188999999994, "coord_origin": "TOPLEFT" }, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 200.22058000000004, "r_x1": 460.87109, "r_y1": 200.22058000000004, "r_x2": 460.87109, "r_y2": 192.15088000000003, "r_x3": 134.765, "r_y3": 192.15088000000003, "coord_origin": "TOPLEFT" }, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41107, "r_y0": 289.50903, "r_x1": 402.97336, "r_y1": 289.50903, "r_x2": 402.97336, "r_y2": 280.98352, "r_x3": 396.41107, "r_y3": 280.98352, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.58682, "r_y0": 289.42343, "r_x1": 425.14911, "r_y1": 289.42343, "r_x2": 425.14911, "r_y2": 280.89792, "r_x3": 418.58682, "r_y3": 280.89792, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.74835, "r_y0": 311.76279, "r_x1": 402.31064, "r_y1": 311.76279, "r_x2": 402.31064, "r_y2": 303.23727, "r_x3": 395.74835, "r_y3": 303.23727, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54214, "r_y0": 311.89532, "r_x1": 414.10443, "r_y1": 311.89532, "r_x2": 414.10443, "r_y2": 303.36981, "r_x3": 407.54214, "r_y3": 303.36981, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56335, "r_y0": 322.9317, "r_x1": 414.12564, "r_y1": 322.9317, "r_x2": 414.12564, "r_y2": 314.40619, "r_x3": 407.56335, "r_y3": 314.40619, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51108, "r_y0": 300.61053000000004, "r_x1": 425.07336, "r_y1": 300.61053000000004, "r_x2": 425.07336, "r_y2": 292.08502000000004, "r_x3": 418.51108, "r_y3": 292.08502000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.59744, "r_y0": 300.61658, "r_x1": 436.1597300000001, "r_y1": 300.61658, "r_x2": 436.1597300000001, "r_y2": 292.09106, "r_x3": 429.59744, "r_y3": 292.09106, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.68759000000006, "r_y0": 300.53781000000004, "r_x1": 447.24987999999996, "r_y1": 300.53781000000004, "r_x2": 447.24987999999996, "r_y2": 292.01230000000004, "r_x3": 440.68759000000006, "r_y3": 292.01230000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6232, "r_y0": 311.82034, "r_x1": 425.18549, "r_y1": 311.82034, "r_x2": 425.18549, "r_y2": 303.29483, "r_x3": 418.6232, "r_y3": 303.29483, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7095299999999, "r_y0": 311.82562, "r_x1": 436.27182, "r_y1": 311.82562, "r_x2": 436.27182, "r_y2": 303.30011, "r_x3": 429.7095299999999, "r_y3": 303.30011, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7996800000001, "r_y0": 311.74762, "r_x1": 447.36197, "r_y1": 311.74762, "r_x2": 447.36197, "r_y2": 303.22211, "r_x3": 440.7996800000001, "r_y3": 303.22211, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62546, "r_y0": 323.09454, "r_x1": 425.18774, "r_y1": 323.09454, "r_x2": 425.18774, "r_y2": 314.56903, "r_x3": 418.62546, "r_y3": 314.56903, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71181999999993, "r_y0": 323.09985, "r_x1": 436.27411, "r_y1": 323.09985, "r_x2": 436.27411, "r_y2": 314.57434, "r_x3": 429.71181999999993, "r_y3": 314.57434, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.80194, "r_y0": 323.02182, "r_x1": 447.36423, "r_y1": 323.02182, "r_x2": 447.36423, "r_y2": 314.49631, "r_x3": 440.80194, "r_y3": 314.49631, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.39746, "r_y0": 333.81583, "r_x1": 413.95975, "r_y1": 333.81583, "r_x2": 413.95975, "r_y2": 325.29031, "r_x3": 407.39746, "r_y3": 325.29031, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.45959, "r_y0": 333.97867, "r_x1": 425.02188, "r_y1": 333.97867, "r_x2": 425.02188, "r_y2": 325.45316, "r_x3": 418.45959, "r_y3": 325.45316, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.54593, "r_y0": 333.98471, "r_x1": 436.10822, "r_y1": 333.98471, "r_x2": 436.10822, "r_y2": 325.4592, "r_x3": 429.54593, "r_y3": 325.4592, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.63608, "r_y0": 333.90594, "r_x1": 447.19836, "r_y1": 333.90594, "r_x2": 447.19836, "r_y2": 325.38043, "r_x3": 440.63608, "r_y3": 325.38043, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.89511000000005, "r_y0": 288.68268, "r_x1": 463.51273000000003, "r_y1": 288.68268, "r_x2": 463.51273000000003, "r_y2": 280.15717, "r_x3": 451.89511000000005, "r_y3": 280.15717, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1557, "r_y0": 300.12427, "r_x1": 463.77332, "r_y1": 300.12427, "r_x2": 463.77332, "r_y2": 291.59875000000005, "r_x3": 452.1557, "r_y3": 291.59875000000005, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.17688000000004, "r_y0": 311.36816, "r_x1": 463.79449000000005, "r_y1": 311.36816, "r_x2": 463.79449000000005, "r_y2": 302.84265, "r_x3": 452.17688000000004, "r_y3": 302.84265, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.09887999999995, "r_y0": 322.6499299999999, "r_x1": 463.71648999999996, "r_y1": 322.6499299999999, "r_x2": 463.71648999999996, "r_y2": 314.12441999999993, "r_x3": 452.09887999999995, "r_y3": 314.12441999999993, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.29733, "r_y0": 333.99457, "r_x1": 463.91495, "r_y1": 333.99457, "r_x2": 463.91495, "r_y2": 325.46906, "r_x3": 452.29733, "r_y3": 325.46906, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.09677, "r_y0": 323.02029000000005, "r_x1": 402.65906, "r_y1": 323.02029000000005, "r_x2": 402.65906, "r_y2": 314.49478, "r_x3": 396.09677, "r_y3": 314.49478, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.99829, "r_y0": 333.91428, "r_x1": 402.56058, "r_y1": 333.91428, "r_x2": 402.56058, "r_y2": 325.38876000000005, "r_x3": 395.99829, "r_y3": 325.38876000000005, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27475, "r_y0": 300.79608, "r_x1": 402.83704, "r_y1": 300.79608, "r_x2": 402.83704, "r_y2": 292.27057, "r_x3": 396.27475, "r_y3": 292.27057, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.54724, "r_y0": 289.49463, "r_x1": 413.60074, "r_y1": 289.49463, "r_x2": 413.60074, "r_y2": 280.96912, "r_x3": 408.54724, "r_y3": 280.96912, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.58966, "r_y0": 289.02277, "r_x1": 435.6431600000001, "r_y1": 289.02277, "r_x2": 435.6431600000001, "r_y2": 280.49725, "r_x3": 430.58966, "r_y3": 280.49725, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08069, "r_y0": 288.90613, "r_x1": 446.13419, "r_y1": 288.90613, "r_x2": 446.13419, "r_y2": 280.38062, "r_x3": 441.08069, "r_y3": 280.38062, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97388, "r_y0": 300.65976, "r_x1": 414.03625, "r_y1": 300.65976, "r_x2": 414.03625, "r_y2": 292.13425, "r_x3": 407.97388, "r_y3": 292.13425, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.25640999999996, "r_y0": 419.7062700000001, "r_x1": 452.87402, "r_y1": 419.7062700000001, "r_x2": 452.87402, "r_y2": 411.1807600000001, "r_x3": 441.25640999999996, "r_y3": 411.1807600000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 406.89935, "r_x1": 432.48929, "r_y1": 406.89935, "r_x2": 432.48929, "r_y2": 399.7947700000001, "r_x3": 393.75256, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.5896000000001, "r_y0": 406.89935, "r_x1": 438.80083999999994, "r_y1": 406.89935, "r_x2": 438.80083999999994, "r_y2": 399.7947700000001, "r_x3": 434.5896000000001, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.90573, "r_y0": 406.89935, "r_x1": 463.22235, "r_y1": 406.89935, "r_x2": 463.22235, "r_y2": 399.7947700000001, "r_x3": 440.90573, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.11816, "r_y0": 265.65179, "r_x1": 413.99307, "r_y1": 265.65179, "r_x2": 413.99307, "r_y2": 258.54718, "r_x3": 384.11816, "r_y3": 258.54718, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 273.77966000000004, "r_x1": 451.45129000000003, "r_y1": 273.77966000000004, "r_x2": 451.45129000000003, "r_y2": 266.67505000000006, "r_x3": 393.75256, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55083999999994, "r_y0": 273.77966000000004, "r_x1": 461.97485, "r_y1": 273.77966000000004, "r_x2": 461.97485, "r_y2": 266.67505000000006, "r_x3": 453.55083999999994, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79318, "r_y0": 406.86474999999996, "r_x1": 233.89371000000003, "r_y1": 406.86474999999996, "r_x2": 233.89371000000003, "r_y2": 399.76016, "r_x3": 151.79318, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99332, "r_y0": 406.86474999999996, "r_x1": 244.41734000000002, "r_y1": 406.86474999999996, "r_x2": 244.41734000000002, "r_y2": 399.76016, "r_x3": 235.99332, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52222, "r_y0": 406.86474999999996, "r_x1": 268.83884, "r_y1": 406.86474999999996, "r_x2": 268.83884, "r_y2": 399.76016, "r_x3": 246.52222, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3298, "r_y0": 220.67920000000004, "r_x1": 159.79837, "r_y1": 220.67920000000004, "r_x2": 159.79837, "r_y2": 213.57457999999997, "r_x3": 154.3298, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07053, "r_y0": 220.67920000000004, "r_x1": 326.53909, "r_y1": 220.67920000000004, "r_x2": 326.53909, "r_y2": 213.57457999999997, "r_x3": 321.07053, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 286.69824, "r_x1": 175.83888, "r_y1": 286.69824, "r_x2": 175.83888, "r_y2": 280.30411, "r_x3": 153.0947, "r_y3": 280.30411, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 293.51501, "r_x1": 172.79608, "r_y1": 293.51501, "r_x2": 172.79608, "r_y2": 287.12088, "r_x3": 160.67039, "r_y3": 287.12088, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 300.33179, "r_x1": 177.91019, "r_y1": 300.33179, "r_x2": 177.91019, "r_y2": 293.93765, "r_x3": 168.24603, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.35785, "r_y0": 300.33179, "r_x1": 278.89804, "r_y1": 300.33179, "r_x2": 278.89804, "r_y2": 293.93765, "r_x3": 263.35785, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79175, "r_y0": 300.33179, "r_x1": 290.4559, "r_y1": 300.33179, "r_x2": 290.4559, "r_y2": 293.93765, "r_x3": 280.79175, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.92926, "r_y0": 300.33179, "r_x1": 351.46945, "r_y1": 300.33179, "r_x2": 351.46945, "r_y2": 293.93765, "r_x3": 335.92926, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 307.14856, "r_x1": 174.68979, "r_y1": 307.14856, "r_x2": 174.68979, "r_y2": 300.75442999999996, "r_x3": 160.67039, "r_y3": 300.75442999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 313.96536, "r_x1": 172.79608, "r_y1": 313.96536, "r_x2": 172.79608, "r_y2": 307.57122999999996, "r_x3": 160.67039, "r_y3": 307.57122999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 320.78214, "r_x1": 181.89255, "r_y1": 320.78214, "r_x2": 181.89255, "r_y2": 314.388, "r_x3": 168.24603, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 320.78214, "r_x1": 214.86666999999997, "r_y1": 320.78214, "r_x2": 214.86666999999997, "r_y2": 314.388, "r_x3": 201.22015, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 320.78214, "r_x1": 247.84079000000003, "r_y1": 320.78214, "r_x2": 247.84079000000003, "r_y2": 314.388, "r_x3": 234.19427000000002, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 327.59890999999993, "r_x1": 174.68979, "r_y1": 327.59890999999993, "r_x2": 174.68979, "r_y2": 321.20477, "r_x3": 160.67039, "r_y3": 321.20477, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 334.41571000000005, "r_x1": 172.79608, "r_y1": 334.41571000000005, "r_x2": 172.79608, "r_y2": 328.02158, "r_x3": 160.67039, "r_y3": 328.02158, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 341.23248, "r_x1": 373.09091, "r_y1": 341.23248, "r_x2": 373.09091, "r_y2": 334.83835, "r_x3": 168.24603, "r_y3": 334.83835, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 348.04926, "r_x1": 174.68979, "r_y1": 348.04926, "r_x2": 174.68979, "r_y2": 341.65512, "r_x3": 160.67039, "r_y3": 341.65512, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 354.86572, "r_x1": 172.79608, "r_y1": 354.86572, "r_x2": 172.79608, "r_y2": 348.47159, "r_x3": 160.67039, "r_y3": 348.47159, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 361.68249999999995, "r_x1": 181.89255, "r_y1": 361.68249999999995, "r_x2": 181.89255, "r_y2": 355.28836000000007, "r_x3": 168.24603, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 361.68249999999995, "r_x1": 214.86666999999997, "r_y1": 361.68249999999995, "r_x2": 214.86666999999997, "r_y2": 355.28836000000007, "r_x3": 201.22015, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 361.68249999999995, "r_x1": 247.84079000000003, "r_y1": 361.68249999999995, "r_x2": 247.84079000000003, "r_y2": 355.28836000000007, "r_x3": 234.19427000000002, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 361.68249999999995, "r_x1": 280.81488, "r_y1": 361.68249999999995, "r_x2": 280.81488, "r_y2": 355.28836000000007, "r_x3": 267.1684, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 368.49929999999995, "r_x1": 174.68979, "r_y1": 368.49929999999995, "r_x2": 174.68979, "r_y2": 362.10516000000007, "r_x3": 160.67039, "r_y3": 362.10516000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 375.31607, "r_x1": 172.79608, "r_y1": 375.31607, "r_x2": 172.79608, "r_y2": 368.92194, "r_x3": 160.67039, "r_y3": 368.92194, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 382.13284, "r_x1": 181.89255, "r_y1": 382.13284, "r_x2": 181.89255, "r_y2": 375.73871, "r_x3": 168.24603, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 382.13284, "r_x1": 214.86666999999997, "r_y1": 382.13284, "r_x2": 214.86666999999997, "r_y2": 375.73871, "r_x3": 201.22015, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 382.13284, "r_x1": 247.84079000000003, "r_y1": 382.13284, "r_x2": 247.84079000000003, "r_y2": 375.73871, "r_x3": 234.19427000000002, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 382.13284, "r_x1": 280.81488, "r_y1": 382.13284, "r_x2": 280.81488, "r_y2": 375.73871, "r_x3": 267.1684, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 388.94965, "r_x1": 174.68979, "r_y1": 388.94965, "r_x2": 174.68979, "r_y2": 382.55551, "r_x3": 160.67039, "r_y3": 382.55551, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 395.76642, "r_x1": 177.73259, "r_y1": 395.76642, "r_x2": 177.73259, "r_y2": 389.37228, "r_x3": 153.0947, "r_y3": 389.37228, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 320.78214, "r_x1": 199.32646, "r_y1": 320.78214, "r_x2": 199.32646, "r_y2": 314.388, "r_x3": 183.78624, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 320.78214, "r_x1": 232.30058, "r_y1": 320.78214, "r_x2": 232.30058, "r_y2": 314.388, "r_x3": 216.76038, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 320.78214, "r_x1": 265.27469, "r_y1": 320.78214, "r_x2": 265.27469, "r_y2": 314.388, "r_x3": 249.73447999999996, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 361.68249999999995, "r_x1": 199.32646, "r_y1": 361.68249999999995, "r_x2": 199.32646, "r_y2": 355.28836000000007, "r_x3": 183.78624, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 361.68249999999995, "r_x1": 232.30058, "r_y1": 361.68249999999995, "r_x2": 232.30058, "r_y2": 355.28836000000007, "r_x3": 216.76038, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 361.68249999999995, "r_x1": 265.27469, "r_y1": 361.68249999999995, "r_x2": 265.27469, "r_y2": 355.28836000000007, "r_x3": 249.73447999999996, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 361.68249999999995, "r_x1": 298.24881, "r_y1": 361.68249999999995, "r_x2": 298.24881, "r_y2": 355.28836000000007, "r_x3": 282.70862, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 382.13284, "r_x1": 199.32646, "r_y1": 382.13284, "r_x2": 199.32646, "r_y2": 375.73871, "r_x3": 183.78624, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 382.13284, "r_x1": 232.30058, "r_y1": 382.13284, "r_x2": 232.30058, "r_y2": 375.73871, "r_x3": 216.76038, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 382.13284, "r_x1": 265.27469, "r_y1": 382.13284, "r_x2": 265.27469, "r_y2": 375.73871, "r_x3": 249.73447999999996, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 382.13284, "r_x1": 298.24881, "r_y1": 382.13284, "r_x2": 298.24881, "r_y2": 375.73871, "r_x3": 282.70862, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06137, "r_y0": 419.85904, "r_x1": 401.62366, "r_y1": 419.85904, "r_x2": 401.62366, "r_y2": 411.33353, "r_x3": 395.06137, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42249, "r_y0": 419.85904, "r_x1": 412.47598, "r_y1": 419.85904, "r_x2": 412.47598, "r_y2": 411.33353, "r_x3": 407.42249, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69287, "r_y0": 419.85904, "r_x1": 425.25516, "r_y1": 419.85904, "r_x2": 425.25516, "r_y2": 411.33353, "r_x3": 418.69287, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5086099999999, "r_y0": 419.85904, "r_x1": 436.5709800000001, "r_y1": 419.85904, "r_x2": 436.5709800000001, "r_y2": 411.33353, "r_x3": 430.5086099999999, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36208, "r_y0": 416.16776, "r_x1": 175.10626, "r_y1": 416.16776, "r_x2": 175.10626, "r_y2": 409.77362, "r_x3": 152.36208, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89366, "r_y0": 416.16776, "r_x1": 191.01935, "r_y1": 416.16776, "r_x2": 191.01935, "r_y2": 409.77362, "r_x3": 178.89366, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.80676, "r_y0": 416.16776, "r_x1": 208.82614, "r_y1": 416.16776, "r_x2": 208.82614, "r_y2": 409.77362, "r_x3": 194.80676, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61354, "r_y0": 416.16776, "r_x1": 226.26003999999998, "r_y1": 416.16776, "r_x2": 226.26003999999998, "r_y2": 409.77362, "r_x3": 212.61354, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.37506000000002, "r_y0": 416.16776, "r_x1": 259.03918, "r_y1": 416.16776, "r_x2": 259.03918, "r_y2": 409.77362, "r_x3": 249.37506000000002, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46358, "r_y0": 424.49936, "r_x1": 269.10144, "r_y1": 424.49936, "r_x2": 269.10144, "r_y2": 418.10522, "r_x3": 244.46358, "r_y3": 418.10522, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.04745000000003, "r_y0": 416.16776, "r_x1": 245.58765000000002, "r_y1": 416.16776, "r_x2": 245.58765000000002, "r_y2": 409.77362, "r_x3": 230.04745000000003, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50595, "r_y0": 265.70556999999997, "r_x1": 159.62473, "r_y1": 265.70556999999997, "r_x2": 159.62473, "r_y2": 258.60095, "r_x3": 154.50595, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74348, "r_y0": 265.70556999999997, "r_x1": 185.21857, "r_y1": 265.70556999999997, "r_x2": 185.21857, "r_y2": 258.60095, "r_x3": 164.74348, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.3548, "r_y0": 273.60168, "r_x1": 222.05352999999997, "r_y1": 273.60168, "r_x2": 222.05352999999997, "r_y2": 266.49707, "r_x3": 164.3548, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15326, "r_y0": 273.60168, "r_x1": 232.57729, "r_y1": 273.60168, "r_x2": 232.57729, "r_y2": 266.49707, "r_x3": 224.15326, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 461.11075, "r_x1": 161.32928, "r_y1": 461.11075, "r_x2": 161.32928, "r_y2": 452.31378, "r_x3": 134.765, "r_y3": 452.31378, "coord_origin": "TOPLEFT" }, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.269, "r_y0": 461.11075, "r_x1": 226.28617999999997, "r_y1": 461.11075, "r_x2": 226.28617999999997, "r_y2": 452.31378, "r_x3": 164.269, "r_y3": 452.31378, "coord_origin": "TOPLEFT" }, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.992, "r_y0": 461.11075, "r_x1": 480.59232000000003, "r_y1": 461.11075, "r_x2": 480.59232000000003, "r_y2": 452.31378, "r_x3": 229.992, "r_y3": 452.31378, "coord_origin": "TOPLEFT" }, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 473.06573, "r_x1": 480.59180000000003, "r_y1": 473.06573, "r_x2": 480.59180000000003, "r_y2": 464.26877, "r_x3": 134.76501, "r_y3": 464.26877, "coord_origin": "TOPLEFT" }, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 485.02072, "r_x1": 480.58673, "r_y1": 485.02072, "r_x2": 480.58673, "r_y2": 476.22375, "r_x3": 134.76501, "r_y3": 476.22375, "coord_origin": "TOPLEFT" }, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 496.97672, "r_x1": 480.58658, "r_y1": 496.97672, "r_x2": 480.58658, "r_y2": 488.17975, "r_x3": 134.76501, "r_y3": 488.17975, "coord_origin": "TOPLEFT" }, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 508.9317, "r_x1": 480.58978, "r_y1": 508.9317, "r_x2": 480.58978, "r_y2": 500.13474, "r_x3": 134.76501, "r_y3": 500.13474, "coord_origin": "TOPLEFT" }, "text": "area of research, in which many novel machine learning algorithms are being", "orig": "area of research, in which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 520.88669, "r_x1": 313.24597, "r_y1": 520.88669, "r_x2": 313.24597, "r_y2": 512.0897199999999, "r_x3": 134.76501, "r_y3": 512.0897199999999, "coord_origin": "TOPLEFT" }, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70901, "r_y0": 533.3476900000001, "r_x1": 480.58884000000006, "r_y1": 533.3476900000001, "r_x2": 480.58884000000006, "r_y2": 524.55072, "r_x3": 149.70901, "r_y3": 524.55072, "coord_origin": "TOPLEFT" }, "text": "Recently emerging SOTA methods for table structure recognition employ", "orig": "Recently emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 545.30368, "r_x1": 480.5917400000001, "r_y1": 545.30368, "r_x2": 480.5917400000001, "r_y2": 536.50671, "r_x3": 134.76501, "r_y3": 536.50671, "coord_origin": "TOPLEFT" }, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 557.25868, "r_x1": 480.58868, "r_y1": 557.25868, "r_x2": 480.58868, "r_y2": 548.46172, "r_x3": 134.76501, "r_y3": 548.46172, "coord_origin": "TOPLEFT" }, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 569.2136800000001, "r_x1": 480.58795, "r_y1": 569.2136800000001, "r_x2": 480.58795, "r_y2": 560.41672, "r_x3": 134.76501, "r_y3": 560.41672, "coord_origin": "TOPLEFT" }, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 581.16869, "r_x1": 480.58978, "r_y1": 581.16869, "r_x2": 480.58978, "r_y2": 572.37172, "r_x3": 134.76501, "r_y3": 572.37172, "coord_origin": "TOPLEFT" }, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 593.12369, "r_x1": 480.59479, "r_y1": 593.12369, "r_x2": 480.59479, "r_y2": 584.32672, "r_x3": 134.76501, "r_y3": 584.32672, "coord_origin": "TOPLEFT" }, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 605.0796799999999, "r_x1": 480.58678999999995, "r_y1": 605.0796799999999, "r_x2": 480.58678999999995, "r_y2": 596.28271, "r_x3": 134.76501, "r_y3": 596.28271, "coord_origin": "TOPLEFT" }, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 617.03468, "r_x1": 480.59476, "r_y1": 617.03468, "r_x2": 480.59476, "r_y2": 608.23772, "r_x3": 134.76501, "r_y3": 608.23772, "coord_origin": "TOPLEFT" }, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 628.98969, "r_x1": 480.5938100000001, "r_y1": 628.98969, "r_x2": 480.5938100000001, "r_y2": 620.19272, "r_x3": 134.76501, "r_y3": 620.19272, "coord_origin": "TOPLEFT" }, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 640.94469, "r_x1": 480.59482, "r_y1": 640.94469, "r_x2": 480.59482, "r_y2": 632.1477199999999, "r_x3": 134.76501, "r_y3": 632.1477199999999, "coord_origin": "TOPLEFT" }, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 652.89969, "r_x1": 480.58771, "r_y1": 652.89969, "r_x2": 480.58771, "r_y2": 644.10272, "r_x3": 134.76501, "r_y3": 644.10272, "coord_origin": "TOPLEFT" }, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 664.8547, "r_x1": 421.45377, "r_y1": 664.8547, "r_x2": 421.45377, "r_y2": 656.05772, "r_x3": 134.76501, "r_y3": 656.05772, "coord_origin": "TOPLEFT" }, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 139.37193, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8580349683761597, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "page_header", "bbox": { "l": 167.81335, "t": 93.77099999999996, "r": 231.72227, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9076642990112305, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "caption", "bbox": { "l": 134.765, "t": 126.33416999999997, "r": 480.59189, "b": 200.22058000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.8939083218574524, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 134.26049999999998, "r_x1": 162.64424, "r_y1": 134.26049999999998, "r_x2": 162.64424, "r_y2": 126.33416999999997, "r_x3": 134.765, "r_y3": 126.33416999999997, "coord_origin": "TOPLEFT" }, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.062, "r_y0": 134.46667000000002, "r_x1": 480.59106, "r_y1": 134.46667000000002, "r_x2": 480.59106, "r_y2": 126.39697000000001, "r_x3": 167.062, "r_y3": 126.39697000000001, "coord_origin": "TOPLEFT" }, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 145.42566, "r_x1": 480.59018, "r_y1": 145.42566, "r_x2": 480.59018, "r_y2": 137.35595999999998, "r_x3": 134.765, "r_y3": 137.35595999999998, "coord_origin": "TOPLEFT" }, "text": "table-example with complex row and column headers, including a 2D empty span,", "orig": "table-example with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 156.38464, "r_x1": 147.95433, "r_y1": 156.38464, "r_x2": 147.95433, "r_y2": 148.31493999999998, "r_x3": 134.765, "r_y3": 148.31493999999998, "coord_origin": "TOPLEFT" }, "text": "(B)", "orig": "(B)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.39224, "r_y0": 156.38464, "r_x1": 480.59096999999997, "r_y1": 156.38464, "r_x2": 480.59096999999997, "r_y2": 148.31493999999998, "r_x3": 152.39224, "r_y3": 148.31493999999998, "coord_origin": "TOPLEFT" }, "text": "minimal graphical representation of table structure using rectangular layout, (C)", "orig": "minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 167.34362999999996, "r_x1": 480.59189, "r_y1": 167.34362999999996, "r_x2": 480.59189, "r_y2": 159.27392999999995, "r_x3": 134.765, "r_y3": 159.27392999999995, "coord_origin": "TOPLEFT" }, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 178.30260999999996, "r_x1": 480.58914000000004, "r_y1": 178.30260999999996, "r_x2": 480.58914000000004, "r_y2": 170.23290999999995, "r_x3": 134.765, "r_y3": 170.23290999999995, "coord_origin": "TOPLEFT" }, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 189.26160000000004, "r_x1": 480.59020999999996, "r_y1": 189.26160000000004, "r_x2": 480.59020999999996, "r_y2": 181.19188999999994, "r_x3": 134.765, "r_y3": 181.19188999999994, "coord_origin": "TOPLEFT" }, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 200.22058000000004, "r_x1": 460.87109, "r_y1": 200.22058000000004, "r_x2": 460.87109, "r_y2": 192.15088000000003, "r_x3": 134.765, "r_y3": 192.15088000000003, "coord_origin": "TOPLEFT" }, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "picture", "bbox": { "l": 148.45364379882812, "t": 208.37423706054688, "r": 464.3608093261719, "b": 425.8462219238281, "coord_origin": "TOPLEFT" }, "confidence": 0.9688959121704102, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41107, "r_y0": 289.50903, "r_x1": 402.97336, "r_y1": 289.50903, "r_x2": 402.97336, "r_y2": 280.98352, "r_x3": 396.41107, "r_y3": 280.98352, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.58682, "r_y0": 289.42343, "r_x1": 425.14911, "r_y1": 289.42343, "r_x2": 425.14911, "r_y2": 280.89792, "r_x3": 418.58682, "r_y3": 280.89792, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.74835, "r_y0": 311.76279, "r_x1": 402.31064, "r_y1": 311.76279, "r_x2": 402.31064, "r_y2": 303.23727, "r_x3": 395.74835, "r_y3": 303.23727, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54214, "r_y0": 311.89532, "r_x1": 414.10443, "r_y1": 311.89532, "r_x2": 414.10443, "r_y2": 303.36981, "r_x3": 407.54214, "r_y3": 303.36981, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56335, "r_y0": 322.9317, "r_x1": 414.12564, "r_y1": 322.9317, "r_x2": 414.12564, "r_y2": 314.40619, "r_x3": 407.56335, "r_y3": 314.40619, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51108, "r_y0": 300.61053000000004, "r_x1": 425.07336, "r_y1": 300.61053000000004, "r_x2": 425.07336, "r_y2": 292.08502000000004, "r_x3": 418.51108, "r_y3": 292.08502000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.59744, "r_y0": 300.61658, "r_x1": 436.1597300000001, "r_y1": 300.61658, "r_x2": 436.1597300000001, "r_y2": 292.09106, "r_x3": 429.59744, "r_y3": 292.09106, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.68759000000006, "r_y0": 300.53781000000004, "r_x1": 447.24987999999996, "r_y1": 300.53781000000004, "r_x2": 447.24987999999996, "r_y2": 292.01230000000004, "r_x3": 440.68759000000006, "r_y3": 292.01230000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6232, "r_y0": 311.82034, "r_x1": 425.18549, "r_y1": 311.82034, "r_x2": 425.18549, "r_y2": 303.29483, "r_x3": 418.6232, "r_y3": 303.29483, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7095299999999, "r_y0": 311.82562, "r_x1": 436.27182, "r_y1": 311.82562, "r_x2": 436.27182, "r_y2": 303.30011, "r_x3": 429.7095299999999, "r_y3": 303.30011, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7996800000001, "r_y0": 311.74762, "r_x1": 447.36197, "r_y1": 311.74762, "r_x2": 447.36197, "r_y2": 303.22211, "r_x3": 440.7996800000001, "r_y3": 303.22211, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62546, "r_y0": 323.09454, "r_x1": 425.18774, "r_y1": 323.09454, "r_x2": 425.18774, "r_y2": 314.56903, "r_x3": 418.62546, "r_y3": 314.56903, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71181999999993, "r_y0": 323.09985, "r_x1": 436.27411, "r_y1": 323.09985, "r_x2": 436.27411, "r_y2": 314.57434, "r_x3": 429.71181999999993, "r_y3": 314.57434, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.80194, "r_y0": 323.02182, "r_x1": 447.36423, "r_y1": 323.02182, "r_x2": 447.36423, "r_y2": 314.49631, "r_x3": 440.80194, "r_y3": 314.49631, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.39746, "r_y0": 333.81583, "r_x1": 413.95975, "r_y1": 333.81583, "r_x2": 413.95975, "r_y2": 325.29031, "r_x3": 407.39746, "r_y3": 325.29031, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.45959, "r_y0": 333.97867, "r_x1": 425.02188, "r_y1": 333.97867, "r_x2": 425.02188, "r_y2": 325.45316, "r_x3": 418.45959, "r_y3": 325.45316, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.54593, "r_y0": 333.98471, "r_x1": 436.10822, "r_y1": 333.98471, "r_x2": 436.10822, "r_y2": 325.4592, "r_x3": 429.54593, "r_y3": 325.4592, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.63608, "r_y0": 333.90594, "r_x1": 447.19836, "r_y1": 333.90594, "r_x2": 447.19836, "r_y2": 325.38043, "r_x3": 440.63608, "r_y3": 325.38043, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.89511000000005, "r_y0": 288.68268, "r_x1": 463.51273000000003, "r_y1": 288.68268, "r_x2": 463.51273000000003, "r_y2": 280.15717, "r_x3": 451.89511000000005, "r_y3": 280.15717, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1557, "r_y0": 300.12427, "r_x1": 463.77332, "r_y1": 300.12427, "r_x2": 463.77332, "r_y2": 291.59875000000005, "r_x3": 452.1557, "r_y3": 291.59875000000005, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.17688000000004, "r_y0": 311.36816, "r_x1": 463.79449000000005, "r_y1": 311.36816, "r_x2": 463.79449000000005, "r_y2": 302.84265, "r_x3": 452.17688000000004, "r_y3": 302.84265, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.09887999999995, "r_y0": 322.6499299999999, "r_x1": 463.71648999999996, "r_y1": 322.6499299999999, "r_x2": 463.71648999999996, "r_y2": 314.12441999999993, "r_x3": 452.09887999999995, "r_y3": 314.12441999999993, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.29733, "r_y0": 333.99457, "r_x1": 463.91495, "r_y1": 333.99457, "r_x2": 463.91495, "r_y2": 325.46906, "r_x3": 452.29733, "r_y3": 325.46906, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.09677, "r_y0": 323.02029000000005, "r_x1": 402.65906, "r_y1": 323.02029000000005, "r_x2": 402.65906, "r_y2": 314.49478, "r_x3": 396.09677, "r_y3": 314.49478, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.99829, "r_y0": 333.91428, "r_x1": 402.56058, "r_y1": 333.91428, "r_x2": 402.56058, "r_y2": 325.38876000000005, "r_x3": 395.99829, "r_y3": 325.38876000000005, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27475, "r_y0": 300.79608, "r_x1": 402.83704, "r_y1": 300.79608, "r_x2": 402.83704, "r_y2": 292.27057, "r_x3": 396.27475, "r_y3": 292.27057, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.54724, "r_y0": 289.49463, "r_x1": 413.60074, "r_y1": 289.49463, "r_x2": 413.60074, "r_y2": 280.96912, "r_x3": 408.54724, "r_y3": 280.96912, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.58966, "r_y0": 289.02277, "r_x1": 435.6431600000001, "r_y1": 289.02277, "r_x2": 435.6431600000001, "r_y2": 280.49725, "r_x3": 430.58966, "r_y3": 280.49725, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08069, "r_y0": 288.90613, "r_x1": 446.13419, "r_y1": 288.90613, "r_x2": 446.13419, "r_y2": 280.38062, "r_x3": 441.08069, "r_y3": 280.38062, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97388, "r_y0": 300.65976, "r_x1": 414.03625, "r_y1": 300.65976, "r_x2": 414.03625, "r_y2": 292.13425, "r_x3": 407.97388, "r_y3": 292.13425, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.25640999999996, "r_y0": 419.7062700000001, "r_x1": 452.87402, "r_y1": 419.7062700000001, "r_x2": 452.87402, "r_y2": 411.1807600000001, "r_x3": 441.25640999999996, "r_y3": 411.1807600000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 406.89935, "r_x1": 432.48929, "r_y1": 406.89935, "r_x2": 432.48929, "r_y2": 399.7947700000001, "r_x3": 393.75256, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.5896000000001, "r_y0": 406.89935, "r_x1": 438.80083999999994, "r_y1": 406.89935, "r_x2": 438.80083999999994, "r_y2": 399.7947700000001, "r_x3": 434.5896000000001, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.90573, "r_y0": 406.89935, "r_x1": 463.22235, "r_y1": 406.89935, "r_x2": 463.22235, "r_y2": 399.7947700000001, "r_x3": 440.90573, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.11816, "r_y0": 265.65179, "r_x1": 413.99307, "r_y1": 265.65179, "r_x2": 413.99307, "r_y2": 258.54718, "r_x3": 384.11816, "r_y3": 258.54718, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 273.77966000000004, "r_x1": 451.45129000000003, "r_y1": 273.77966000000004, "r_x2": 451.45129000000003, "r_y2": 266.67505000000006, "r_x3": 393.75256, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55083999999994, "r_y0": 273.77966000000004, "r_x1": 461.97485, "r_y1": 273.77966000000004, "r_x2": 461.97485, "r_y2": 266.67505000000006, "r_x3": 453.55083999999994, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79318, "r_y0": 406.86474999999996, "r_x1": 233.89371000000003, "r_y1": 406.86474999999996, "r_x2": 233.89371000000003, "r_y2": 399.76016, "r_x3": 151.79318, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99332, "r_y0": 406.86474999999996, "r_x1": 244.41734000000002, "r_y1": 406.86474999999996, "r_x2": 244.41734000000002, "r_y2": 399.76016, "r_x3": 235.99332, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52222, "r_y0": 406.86474999999996, "r_x1": 268.83884, "r_y1": 406.86474999999996, "r_x2": 268.83884, "r_y2": 399.76016, "r_x3": 246.52222, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3298, "r_y0": 220.67920000000004, "r_x1": 159.79837, "r_y1": 220.67920000000004, "r_x2": 159.79837, "r_y2": 213.57457999999997, "r_x3": 154.3298, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07053, "r_y0": 220.67920000000004, "r_x1": 326.53909, "r_y1": 220.67920000000004, "r_x2": 326.53909, "r_y2": 213.57457999999997, "r_x3": 321.07053, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 286.69824, "r_x1": 175.83888, "r_y1": 286.69824, "r_x2": 175.83888, "r_y2": 280.30411, "r_x3": 153.0947, "r_y3": 280.30411, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 293.51501, "r_x1": 172.79608, "r_y1": 293.51501, "r_x2": 172.79608, "r_y2": 287.12088, "r_x3": 160.67039, "r_y3": 287.12088, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 300.33179, "r_x1": 177.91019, "r_y1": 300.33179, "r_x2": 177.91019, "r_y2": 293.93765, "r_x3": 168.24603, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.35785, "r_y0": 300.33179, "r_x1": 278.89804, "r_y1": 300.33179, "r_x2": 278.89804, "r_y2": 293.93765, "r_x3": 263.35785, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79175, "r_y0": 300.33179, "r_x1": 290.4559, "r_y1": 300.33179, "r_x2": 290.4559, "r_y2": 293.93765, "r_x3": 280.79175, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.92926, "r_y0": 300.33179, "r_x1": 351.46945, "r_y1": 300.33179, "r_x2": 351.46945, "r_y2": 293.93765, "r_x3": 335.92926, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 307.14856, "r_x1": 174.68979, "r_y1": 307.14856, "r_x2": 174.68979, "r_y2": 300.75442999999996, "r_x3": 160.67039, "r_y3": 300.75442999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 313.96536, "r_x1": 172.79608, "r_y1": 313.96536, "r_x2": 172.79608, "r_y2": 307.57122999999996, "r_x3": 160.67039, "r_y3": 307.57122999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 320.78214, "r_x1": 181.89255, "r_y1": 320.78214, "r_x2": 181.89255, "r_y2": 314.388, "r_x3": 168.24603, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 320.78214, "r_x1": 214.86666999999997, "r_y1": 320.78214, "r_x2": 214.86666999999997, "r_y2": 314.388, "r_x3": 201.22015, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 320.78214, "r_x1": 247.84079000000003, "r_y1": 320.78214, "r_x2": 247.84079000000003, "r_y2": 314.388, "r_x3": 234.19427000000002, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 327.59890999999993, "r_x1": 174.68979, "r_y1": 327.59890999999993, "r_x2": 174.68979, "r_y2": 321.20477, "r_x3": 160.67039, "r_y3": 321.20477, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 334.41571000000005, "r_x1": 172.79608, "r_y1": 334.41571000000005, "r_x2": 172.79608, "r_y2": 328.02158, "r_x3": 160.67039, "r_y3": 328.02158, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 341.23248, "r_x1": 373.09091, "r_y1": 341.23248, "r_x2": 373.09091, "r_y2": 334.83835, "r_x3": 168.24603, "r_y3": 334.83835, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 348.04926, "r_x1": 174.68979, "r_y1": 348.04926, "r_x2": 174.68979, "r_y2": 341.65512, "r_x3": 160.67039, "r_y3": 341.65512, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 354.86572, "r_x1": 172.79608, "r_y1": 354.86572, "r_x2": 172.79608, "r_y2": 348.47159, "r_x3": 160.67039, "r_y3": 348.47159, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 361.68249999999995, "r_x1": 181.89255, "r_y1": 361.68249999999995, "r_x2": 181.89255, "r_y2": 355.28836000000007, "r_x3": 168.24603, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 361.68249999999995, "r_x1": 214.86666999999997, "r_y1": 361.68249999999995, "r_x2": 214.86666999999997, "r_y2": 355.28836000000007, "r_x3": 201.22015, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 361.68249999999995, "r_x1": 247.84079000000003, "r_y1": 361.68249999999995, "r_x2": 247.84079000000003, "r_y2": 355.28836000000007, "r_x3": 234.19427000000002, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 361.68249999999995, "r_x1": 280.81488, "r_y1": 361.68249999999995, "r_x2": 280.81488, "r_y2": 355.28836000000007, "r_x3": 267.1684, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 368.49929999999995, "r_x1": 174.68979, "r_y1": 368.49929999999995, "r_x2": 174.68979, "r_y2": 362.10516000000007, "r_x3": 160.67039, "r_y3": 362.10516000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 375.31607, "r_x1": 172.79608, "r_y1": 375.31607, "r_x2": 172.79608, "r_y2": 368.92194, "r_x3": 160.67039, "r_y3": 368.92194, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 382.13284, "r_x1": 181.89255, "r_y1": 382.13284, "r_x2": 181.89255, "r_y2": 375.73871, "r_x3": 168.24603, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 382.13284, "r_x1": 214.86666999999997, "r_y1": 382.13284, "r_x2": 214.86666999999997, "r_y2": 375.73871, "r_x3": 201.22015, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 382.13284, "r_x1": 247.84079000000003, "r_y1": 382.13284, "r_x2": 247.84079000000003, "r_y2": 375.73871, "r_x3": 234.19427000000002, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 382.13284, "r_x1": 280.81488, "r_y1": 382.13284, "r_x2": 280.81488, "r_y2": 375.73871, "r_x3": 267.1684, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 388.94965, "r_x1": 174.68979, "r_y1": 388.94965, "r_x2": 174.68979, "r_y2": 382.55551, "r_x3": 160.67039, "r_y3": 382.55551, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 395.76642, "r_x1": 177.73259, "r_y1": 395.76642, "r_x2": 177.73259, "r_y2": 389.37228, "r_x3": 153.0947, "r_y3": 389.37228, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 320.78214, "r_x1": 199.32646, "r_y1": 320.78214, "r_x2": 199.32646, "r_y2": 314.388, "r_x3": 183.78624, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 320.78214, "r_x1": 232.30058, "r_y1": 320.78214, "r_x2": 232.30058, "r_y2": 314.388, "r_x3": 216.76038, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 320.78214, "r_x1": 265.27469, "r_y1": 320.78214, "r_x2": 265.27469, "r_y2": 314.388, "r_x3": 249.73447999999996, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 361.68249999999995, "r_x1": 199.32646, "r_y1": 361.68249999999995, "r_x2": 199.32646, "r_y2": 355.28836000000007, "r_x3": 183.78624, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 361.68249999999995, "r_x1": 232.30058, "r_y1": 361.68249999999995, "r_x2": 232.30058, "r_y2": 355.28836000000007, "r_x3": 216.76038, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 361.68249999999995, "r_x1": 265.27469, "r_y1": 361.68249999999995, "r_x2": 265.27469, "r_y2": 355.28836000000007, "r_x3": 249.73447999999996, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 361.68249999999995, "r_x1": 298.24881, "r_y1": 361.68249999999995, "r_x2": 298.24881, "r_y2": 355.28836000000007, "r_x3": 282.70862, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 382.13284, "r_x1": 199.32646, "r_y1": 382.13284, "r_x2": 199.32646, "r_y2": 375.73871, "r_x3": 183.78624, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 382.13284, "r_x1": 232.30058, "r_y1": 382.13284, "r_x2": 232.30058, "r_y2": 375.73871, "r_x3": 216.76038, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 382.13284, "r_x1": 265.27469, "r_y1": 382.13284, "r_x2": 265.27469, "r_y2": 375.73871, "r_x3": 249.73447999999996, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 382.13284, "r_x1": 298.24881, "r_y1": 382.13284, "r_x2": 298.24881, "r_y2": 375.73871, "r_x3": 282.70862, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06137, "r_y0": 419.85904, "r_x1": 401.62366, "r_y1": 419.85904, "r_x2": 401.62366, "r_y2": 411.33353, "r_x3": 395.06137, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42249, "r_y0": 419.85904, "r_x1": 412.47598, "r_y1": 419.85904, "r_x2": 412.47598, "r_y2": 411.33353, "r_x3": 407.42249, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69287, "r_y0": 419.85904, "r_x1": 425.25516, "r_y1": 419.85904, "r_x2": 425.25516, "r_y2": 411.33353, "r_x3": 418.69287, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5086099999999, "r_y0": 419.85904, "r_x1": 436.5709800000001, "r_y1": 419.85904, "r_x2": 436.5709800000001, "r_y2": 411.33353, "r_x3": 430.5086099999999, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36208, "r_y0": 416.16776, "r_x1": 175.10626, "r_y1": 416.16776, "r_x2": 175.10626, "r_y2": 409.77362, "r_x3": 152.36208, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89366, "r_y0": 416.16776, "r_x1": 191.01935, "r_y1": 416.16776, "r_x2": 191.01935, "r_y2": 409.77362, "r_x3": 178.89366, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.80676, "r_y0": 416.16776, "r_x1": 208.82614, "r_y1": 416.16776, "r_x2": 208.82614, "r_y2": 409.77362, "r_x3": 194.80676, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61354, "r_y0": 416.16776, "r_x1": 226.26003999999998, "r_y1": 416.16776, "r_x2": 226.26003999999998, "r_y2": 409.77362, "r_x3": 212.61354, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.37506000000002, "r_y0": 416.16776, "r_x1": 259.03918, "r_y1": 416.16776, "r_x2": 259.03918, "r_y2": 409.77362, "r_x3": 249.37506000000002, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46358, "r_y0": 424.49936, "r_x1": 269.10144, "r_y1": 424.49936, "r_x2": 269.10144, "r_y2": 418.10522, "r_x3": 244.46358, "r_y3": 418.10522, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.04745000000003, "r_y0": 416.16776, "r_x1": 245.58765000000002, "r_y1": 416.16776, "r_x2": 245.58765000000002, "r_y2": 409.77362, "r_x3": 230.04745000000003, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50595, "r_y0": 265.70556999999997, "r_x1": 159.62473, "r_y1": 265.70556999999997, "r_x2": 159.62473, "r_y2": 258.60095, "r_x3": 154.50595, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74348, "r_y0": 265.70556999999997, "r_x1": 185.21857, "r_y1": 265.70556999999997, "r_x2": 185.21857, "r_y2": 258.60095, "r_x3": 164.74348, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.3548, "r_y0": 273.60168, "r_x1": 222.05352999999997, "r_y1": 273.60168, "r_x2": 222.05352999999997, "r_y2": 266.49707, "r_x3": 164.3548, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15326, "r_y0": 273.60168, "r_x1": 232.57729, "r_y1": 273.60168, "r_x2": 232.57729, "r_y2": 266.49707, "r_x3": 224.15326, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 396.41107, "t": 280.98352, "r": 402.97336, "b": 289.50903, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41107, "r_y0": 289.50903, "r_x1": 402.97336, "r_y1": 289.50903, "r_x2": 402.97336, "r_y2": 280.98352, "r_x3": 396.41107, "r_y3": 280.98352, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 418.58682, "t": 280.89792, "r": 425.14911, "b": 289.42343, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.58682, "r_y0": 289.42343, "r_x1": 425.14911, "r_y1": 289.42343, "r_x2": 425.14911, "r_y2": 280.89792, "r_x3": 418.58682, "r_y3": 280.89792, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 395.74835, "t": 303.23727, "r": 402.31064, "b": 311.76279, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.74835, "r_y0": 311.76279, "r_x1": 402.31064, "r_y1": 311.76279, "r_x2": 402.31064, "r_y2": 303.23727, "r_x3": 395.74835, "r_y3": 303.23727, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 407.54214, "t": 303.36981, "r": 414.10443, "b": 311.89532, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54214, "r_y0": 311.89532, "r_x1": 414.10443, "r_y1": 311.89532, "r_x2": 414.10443, "r_y2": 303.36981, "r_x3": 407.54214, "r_y3": 303.36981, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 407.56335, "t": 314.40619, "r": 414.12564, "b": 322.9317, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56335, "r_y0": 322.9317, "r_x1": 414.12564, "r_y1": 322.9317, "r_x2": 414.12564, "r_y2": 314.40619, "r_x3": 407.56335, "r_y3": 314.40619, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 418.51108, "t": 292.08502000000004, "r": 425.07336, "b": 300.61053000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51108, "r_y0": 300.61053000000004, "r_x1": 425.07336, "r_y1": 300.61053000000004, "r_x2": 425.07336, "r_y2": 292.08502000000004, "r_x3": 418.51108, "r_y3": 292.08502000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 429.59744, "t": 292.09106, "r": 436.1597300000001, "b": 300.61658, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.59744, "r_y0": 300.61658, "r_x1": 436.1597300000001, "r_y1": 300.61658, "r_x2": 436.1597300000001, "r_y2": 292.09106, "r_x3": 429.59744, "r_y3": 292.09106, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 440.68759000000006, "t": 292.01230000000004, "r": 447.24987999999996, "b": 300.53781000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.68759000000006, "r_y0": 300.53781000000004, "r_x1": 447.24987999999996, "r_y1": 300.53781000000004, "r_x2": 447.24987999999996, "r_y2": 292.01230000000004, "r_x3": 440.68759000000006, "r_y3": 292.01230000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 418.6232, "t": 303.29483, "r": 425.18549, "b": 311.82034, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6232, "r_y0": 311.82034, "r_x1": 425.18549, "r_y1": 311.82034, "r_x2": 425.18549, "r_y2": 303.29483, "r_x3": 418.6232, "r_y3": 303.29483, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 429.7095299999999, "t": 303.30011, "r": 436.27182, "b": 311.82562, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7095299999999, "r_y0": 311.82562, "r_x1": 436.27182, "r_y1": 311.82562, "r_x2": 436.27182, "r_y2": 303.30011, "r_x3": 429.7095299999999, "r_y3": 303.30011, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 440.7996800000001, "t": 303.22211, "r": 447.36197, "b": 311.74762, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7996800000001, "r_y0": 311.74762, "r_x1": 447.36197, "r_y1": 311.74762, "r_x2": 447.36197, "r_y2": 303.22211, "r_x3": 440.7996800000001, "r_y3": 303.22211, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 418.62546, "t": 314.56903, "r": 425.18774, "b": 323.09454, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62546, "r_y0": 323.09454, "r_x1": 425.18774, "r_y1": 323.09454, "r_x2": 425.18774, "r_y2": 314.56903, "r_x3": 418.62546, "r_y3": 314.56903, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 429.71181999999993, "t": 314.57434, "r": 436.27411, "b": 323.09985, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71181999999993, "r_y0": 323.09985, "r_x1": 436.27411, "r_y1": 323.09985, "r_x2": 436.27411, "r_y2": 314.57434, "r_x3": 429.71181999999993, "r_y3": 314.57434, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 440.80194, "t": 314.49631, "r": 447.36423, "b": 323.02182, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.80194, "r_y0": 323.02182, "r_x1": 447.36423, "r_y1": 323.02182, "r_x2": 447.36423, "r_y2": 314.49631, "r_x3": 440.80194, "r_y3": 314.49631, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 407.39746, "t": 325.29031, "r": 413.95975, "b": 333.81583, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.39746, "r_y0": 333.81583, "r_x1": 413.95975, "r_y1": 333.81583, "r_x2": 413.95975, "r_y2": 325.29031, "r_x3": 407.39746, "r_y3": 325.29031, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 418.45959, "t": 325.45316, "r": 425.02188, "b": 333.97867, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.45959, "r_y0": 333.97867, "r_x1": 425.02188, "r_y1": 333.97867, "r_x2": 425.02188, "r_y2": 325.45316, "r_x3": 418.45959, "r_y3": 325.45316, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 429.54593, "t": 325.4592, "r": 436.10822, "b": 333.98471, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.54593, "r_y0": 333.98471, "r_x1": 436.10822, "r_y1": 333.98471, "r_x2": 436.10822, "r_y2": 325.4592, "r_x3": 429.54593, "r_y3": 325.4592, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 440.63608, "t": 325.38043, "r": 447.19836, "b": 333.90594, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.63608, "r_y0": 333.90594, "r_x1": 447.19836, "r_y1": 333.90594, "r_x2": 447.19836, "r_y2": 325.38043, "r_x3": 440.63608, "r_y3": 325.38043, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 451.89511000000005, "t": 280.15717, "r": 463.51273000000003, "b": 288.68268, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.89511000000005, "r_y0": 288.68268, "r_x1": 463.51273000000003, "r_y1": 288.68268, "r_x2": 463.51273000000003, "r_y2": 280.15717, "r_x3": 451.89511000000005, "r_y3": 280.15717, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 452.1557, "t": 291.59875000000005, "r": 463.77332, "b": 300.12427, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1557, "r_y0": 300.12427, "r_x1": 463.77332, "r_y1": 300.12427, "r_x2": 463.77332, "r_y2": 291.59875000000005, "r_x3": 452.1557, "r_y3": 291.59875000000005, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 452.17688000000004, "t": 302.84265, "r": 463.79449000000005, "b": 311.36816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.17688000000004, "r_y0": 311.36816, "r_x1": 463.79449000000005, "r_y1": 311.36816, "r_x2": 463.79449000000005, "r_y2": 302.84265, "r_x3": 452.17688000000004, "r_y3": 302.84265, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 452.09887999999995, "t": 314.12441999999993, "r": 463.71648999999996, "b": 322.6499299999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.09887999999995, "r_y0": 322.6499299999999, "r_x1": 463.71648999999996, "r_y1": 322.6499299999999, "r_x2": 463.71648999999996, "r_y2": 314.12441999999993, "r_x3": 452.09887999999995, "r_y3": 314.12441999999993, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 452.29733, "t": 325.46906, "r": 463.91495, "b": 333.99457, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.29733, "r_y0": 333.99457, "r_x1": 463.91495, "r_y1": 333.99457, "r_x2": 463.91495, "r_y2": 325.46906, "r_x3": 452.29733, "r_y3": 325.46906, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 396.09677, "t": 314.49478, "r": 402.65906, "b": 323.02029000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.09677, "r_y0": 323.02029000000005, "r_x1": 402.65906, "r_y1": 323.02029000000005, "r_x2": 402.65906, "r_y2": 314.49478, "r_x3": 396.09677, "r_y3": 314.49478, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 395.99829, "t": 325.38876000000005, "r": 402.56058, "b": 333.91428, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.99829, "r_y0": 333.91428, "r_x1": 402.56058, "r_y1": 333.91428, "r_x2": 402.56058, "r_y2": 325.38876000000005, "r_x3": 395.99829, "r_y3": 325.38876000000005, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.27475, "t": 292.27057, "r": 402.83704, "b": 300.79608, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27475, "r_y0": 300.79608, "r_x1": 402.83704, "r_y1": 300.79608, "r_x2": 402.83704, "r_y2": 292.27057, "r_x3": 396.27475, "r_y3": 292.27057, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 408.54724, "t": 280.96912, "r": 413.60074, "b": 289.49463, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.54724, "r_y0": 289.49463, "r_x1": 413.60074, "r_y1": 289.49463, "r_x2": 413.60074, "r_y2": 280.96912, "r_x3": 408.54724, "r_y3": 280.96912, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 430.58966, "t": 280.49725, "r": 435.6431600000001, "b": 289.02277, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.58966, "r_y0": 289.02277, "r_x1": 435.6431600000001, "r_y1": 289.02277, "r_x2": 435.6431600000001, "r_y2": 280.49725, "r_x3": 430.58966, "r_y3": 280.49725, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 441.08069, "t": 280.38062, "r": 446.13419, "b": 288.90613, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08069, "r_y0": 288.90613, "r_x1": 446.13419, "r_y1": 288.90613, "r_x2": 446.13419, "r_y2": 280.38062, "r_x3": 441.08069, "r_y3": 280.38062, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 407.97388, "t": 292.13425, "r": 414.03625, "b": 300.65976, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97388, "r_y0": 300.65976, "r_x1": 414.03625, "r_y1": 300.65976, "r_x2": 414.03625, "r_y2": 292.13425, "r_x3": 407.97388, "r_y3": 292.13425, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 441.25640999999996, "t": 411.1807600000001, "r": 452.87402, "b": 419.7062700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.25640999999996, "r_y0": 419.7062700000001, "r_x1": 452.87402, "r_y1": 419.7062700000001, "r_x2": 452.87402, "r_y2": 411.1807600000001, "r_x3": 441.25640999999996, "r_y3": 411.1807600000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 393.75256, "t": 399.7947700000001, "r": 432.48929, "b": 406.89935, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 406.89935, "r_x1": 432.48929, "r_y1": 406.89935, "r_x2": 432.48929, "r_y2": 399.7947700000001, "r_x3": 393.75256, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 434.5896000000001, "t": 399.7947700000001, "r": 438.80083999999994, "b": 406.89935, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.5896000000001, "r_y0": 406.89935, "r_x1": 438.80083999999994, "r_y1": 406.89935, "r_x2": 438.80083999999994, "r_y2": 399.7947700000001, "r_x3": 434.5896000000001, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 440.90573, "t": 399.7947700000001, "r": 463.22235, "b": 406.89935, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.90573, "r_y0": 406.89935, "r_x1": 463.22235, "r_y1": 406.89935, "r_x2": 463.22235, "r_y2": 399.7947700000001, "r_x3": 440.90573, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 384.11816, "t": 258.54718, "r": 413.99307, "b": 265.65179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.11816, "r_y0": 265.65179, "r_x1": 413.99307, "r_y1": 265.65179, "r_x2": 413.99307, "r_y2": 258.54718, "r_x3": 384.11816, "r_y3": 258.54718, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 393.75256, "t": 266.67505000000006, "r": 451.45129000000003, "b": 273.77966000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 273.77966000000004, "r_x1": 451.45129000000003, "r_y1": 273.77966000000004, "r_x2": 451.45129000000003, "r_y2": 266.67505000000006, "r_x3": 393.75256, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 453.55083999999994, "t": 266.67505000000006, "r": 461.97485, "b": 273.77966000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55083999999994, "r_y0": 273.77966000000004, "r_x1": 461.97485, "r_y1": 273.77966000000004, "r_x2": 461.97485, "r_y2": 266.67505000000006, "r_x3": 453.55083999999994, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 151.79318, "t": 399.76016, "r": 233.89371000000003, "b": 406.86474999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79318, "r_y0": 406.86474999999996, "r_x1": 233.89371000000003, "r_y1": 406.86474999999996, "r_x2": 233.89371000000003, "r_y2": 399.76016, "r_x3": 151.79318, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 235.99332, "t": 399.76016, "r": 244.41734000000002, "b": 406.86474999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99332, "r_y0": 406.86474999999996, "r_x1": 244.41734000000002, "r_y1": 406.86474999999996, "r_x2": 244.41734000000002, "r_y2": 399.76016, "r_x3": 235.99332, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 246.52222, "t": 399.76016, "r": 268.83884, "b": 406.86474999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52222, "r_y0": 406.86474999999996, "r_x1": 268.83884, "r_y1": 406.86474999999996, "r_x2": 268.83884, "r_y2": 399.76016, "r_x3": 246.52222, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 154.3298, "t": 213.57457999999997, "r": 159.79837, "b": 220.67920000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3298, "r_y0": 220.67920000000004, "r_x1": 159.79837, "r_y1": 220.67920000000004, "r_x2": 159.79837, "r_y2": 213.57457999999997, "r_x3": 154.3298, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 321.07053, "t": 213.57457999999997, "r": 326.53909, "b": 220.67920000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07053, "r_y0": 220.67920000000004, "r_x1": 326.53909, "r_y1": 220.67920000000004, "r_x2": 326.53909, "r_y2": 213.57457999999997, "r_x3": 321.07053, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 153.0947, "t": 280.30411, "r": 175.83888, "b": 286.69824, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 286.69824, "r_x1": 175.83888, "r_y1": 286.69824, "r_x2": 175.83888, "r_y2": 280.30411, "r_x3": 153.0947, "r_y3": 280.30411, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 160.67039, "t": 287.12088, "r": 172.79608, "b": 293.51501, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 293.51501, "r_x1": 172.79608, "r_y1": 293.51501, "r_x2": 172.79608, "r_y2": 287.12088, "r_x3": 160.67039, "r_y3": 287.12088, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 168.24603, "t": 293.93765, "r": 177.91019, "b": 300.33179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 300.33179, "r_x1": 177.91019, "r_y1": 300.33179, "r_x2": 177.91019, "r_y2": 293.93765, "r_x3": 168.24603, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 263.35785, "t": 293.93765, "r": 278.89804, "b": 300.33179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.35785, "r_y0": 300.33179, "r_x1": 278.89804, "r_y1": 300.33179, "r_x2": 278.89804, "r_y2": 293.93765, "r_x3": 263.35785, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 280.79175, "t": 293.93765, "r": 290.4559, "b": 300.33179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79175, "r_y0": 300.33179, "r_x1": 290.4559, "r_y1": 300.33179, "r_x2": 290.4559, "r_y2": 293.93765, "r_x3": 280.79175, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 335.92926, "t": 293.93765, "r": 351.46945, "b": 300.33179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.92926, "r_y0": 300.33179, "r_x1": 351.46945, "r_y1": 300.33179, "r_x2": 351.46945, "r_y2": 293.93765, "r_x3": 335.92926, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 160.67039, "t": 300.75442999999996, "r": 174.68979, "b": 307.14856, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 307.14856, "r_x1": 174.68979, "r_y1": 307.14856, "r_x2": 174.68979, "r_y2": 300.75442999999996, "r_x3": 160.67039, "r_y3": 300.75442999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 160.67039, "t": 307.57122999999996, "r": 172.79608, "b": 313.96536, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 313.96536, "r_x1": 172.79608, "r_y1": 313.96536, "r_x2": 172.79608, "r_y2": 307.57122999999996, "r_x3": 160.67039, "r_y3": 307.57122999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 168.24603, "t": 314.388, "r": 181.89255, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 320.78214, "r_x1": 181.89255, "r_y1": 320.78214, "r_x2": 181.89255, "r_y2": 314.388, "r_x3": 168.24603, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 201.22015, "t": 314.388, "r": 214.86666999999997, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 320.78214, "r_x1": 214.86666999999997, "r_y1": 320.78214, "r_x2": 214.86666999999997, "r_y2": 314.388, "r_x3": 201.22015, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 234.19427000000002, "t": 314.388, "r": 247.84079000000003, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 320.78214, "r_x1": 247.84079000000003, "r_y1": 320.78214, "r_x2": 247.84079000000003, "r_y2": 314.388, "r_x3": 234.19427000000002, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 160.67039, "t": 321.20477, "r": 174.68979, "b": 327.59890999999993, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 327.59890999999993, "r_x1": 174.68979, "r_y1": 327.59890999999993, "r_x2": 174.68979, "r_y2": 321.20477, "r_x3": 160.67039, "r_y3": 321.20477, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 160.67039, "t": 328.02158, "r": 172.79608, "b": 334.41571000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 334.41571000000005, "r_x1": 172.79608, "r_y1": 334.41571000000005, "r_x2": 172.79608, "r_y2": 328.02158, "r_x3": 160.67039, "r_y3": 328.02158, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 168.24603, "t": 334.83835, "r": 373.09091, "b": 341.23248, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 341.23248, "r_x1": 373.09091, "r_y1": 341.23248, "r_x2": 373.09091, "r_y2": 334.83835, "r_x3": 168.24603, "r_y3": 334.83835, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 160.67039, "t": 341.65512, "r": 174.68979, "b": 348.04926, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 348.04926, "r_x1": 174.68979, "r_y1": 348.04926, "r_x2": 174.68979, "r_y2": 341.65512, "r_x3": 160.67039, "r_y3": 341.65512, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 160.67039, "t": 348.47159, "r": 172.79608, "b": 354.86572, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 354.86572, "r_x1": 172.79608, "r_y1": 354.86572, "r_x2": 172.79608, "r_y2": 348.47159, "r_x3": 160.67039, "r_y3": 348.47159, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 168.24603, "t": 355.28836000000007, "r": 181.89255, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 361.68249999999995, "r_x1": 181.89255, "r_y1": 361.68249999999995, "r_x2": 181.89255, "r_y2": 355.28836000000007, "r_x3": 168.24603, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 201.22015, "t": 355.28836000000007, "r": 214.86666999999997, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 361.68249999999995, "r_x1": 214.86666999999997, "r_y1": 361.68249999999995, "r_x2": 214.86666999999997, "r_y2": 355.28836000000007, "r_x3": 201.22015, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 234.19427000000002, "t": 355.28836000000007, "r": 247.84079000000003, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 361.68249999999995, "r_x1": 247.84079000000003, "r_y1": 361.68249999999995, "r_x2": 247.84079000000003, "r_y2": 355.28836000000007, "r_x3": 234.19427000000002, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 267.1684, "t": 355.28836000000007, "r": 280.81488, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 361.68249999999995, "r_x1": 280.81488, "r_y1": 361.68249999999995, "r_x2": 280.81488, "r_y2": 355.28836000000007, "r_x3": 267.1684, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 160.67039, "t": 362.10516000000007, "r": 174.68979, "b": 368.49929999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 368.49929999999995, "r_x1": 174.68979, "r_y1": 368.49929999999995, "r_x2": 174.68979, "r_y2": 362.10516000000007, "r_x3": 160.67039, "r_y3": 362.10516000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 160.67039, "t": 368.92194, "r": 172.79608, "b": 375.31607, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 375.31607, "r_x1": 172.79608, "r_y1": 375.31607, "r_x2": 172.79608, "r_y2": 368.92194, "r_x3": 160.67039, "r_y3": 368.92194, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 168.24603, "t": 375.73871, "r": 181.89255, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 382.13284, "r_x1": 181.89255, "r_y1": 382.13284, "r_x2": 181.89255, "r_y2": 375.73871, "r_x3": 168.24603, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 201.22015, "t": 375.73871, "r": 214.86666999999997, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 382.13284, "r_x1": 214.86666999999997, "r_y1": 382.13284, "r_x2": 214.86666999999997, "r_y2": 375.73871, "r_x3": 201.22015, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 234.19427000000002, "t": 375.73871, "r": 247.84079000000003, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 382.13284, "r_x1": 247.84079000000003, "r_y1": 382.13284, "r_x2": 247.84079000000003, "r_y2": 375.73871, "r_x3": 234.19427000000002, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 267.1684, "t": 375.73871, "r": 280.81488, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 382.13284, "r_x1": 280.81488, "r_y1": 382.13284, "r_x2": 280.81488, "r_y2": 375.73871, "r_x3": 267.1684, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 160.67039, "t": 382.55551, "r": 174.68979, "b": 388.94965, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 388.94965, "r_x1": 174.68979, "r_y1": 388.94965, "r_x2": 174.68979, "r_y2": 382.55551, "r_x3": 160.67039, "r_y3": 382.55551, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 153.0947, "t": 389.37228, "r": 177.73259, "b": 395.76642, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 395.76642, "r_x1": 177.73259, "r_y1": 395.76642, "r_x2": 177.73259, "r_y2": 389.37228, "r_x3": 153.0947, "r_y3": 389.37228, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.78624, "t": 314.388, "r": 199.32646, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 320.78214, "r_x1": 199.32646, "r_y1": 320.78214, "r_x2": 199.32646, "r_y2": 314.388, "r_x3": 183.78624, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 216.76038, "t": 314.388, "r": 232.30058, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 320.78214, "r_x1": 232.30058, "r_y1": 320.78214, "r_x2": 232.30058, "r_y2": 314.388, "r_x3": 216.76038, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 249.73447999999996, "t": 314.388, "r": 265.27469, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 320.78214, "r_x1": 265.27469, "r_y1": 320.78214, "r_x2": 265.27469, "r_y2": 314.388, "r_x3": 249.73447999999996, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 183.78624, "t": 355.28836000000007, "r": 199.32646, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 361.68249999999995, "r_x1": 199.32646, "r_y1": 361.68249999999995, "r_x2": 199.32646, "r_y2": 355.28836000000007, "r_x3": 183.78624, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 216.76038, "t": 355.28836000000007, "r": 232.30058, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 361.68249999999995, "r_x1": 232.30058, "r_y1": 361.68249999999995, "r_x2": 232.30058, "r_y2": 355.28836000000007, "r_x3": 216.76038, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 249.73447999999996, "t": 355.28836000000007, "r": 265.27469, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 361.68249999999995, "r_x1": 265.27469, "r_y1": 361.68249999999995, "r_x2": 265.27469, "r_y2": 355.28836000000007, "r_x3": 249.73447999999996, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 282.70862, "t": 355.28836000000007, "r": 298.24881, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 361.68249999999995, "r_x1": 298.24881, "r_y1": 361.68249999999995, "r_x2": 298.24881, "r_y2": 355.28836000000007, "r_x3": 282.70862, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.78624, "t": 375.73871, "r": 199.32646, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 382.13284, "r_x1": 199.32646, "r_y1": 382.13284, "r_x2": 199.32646, "r_y2": 375.73871, "r_x3": 183.78624, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 216.76038, "t": 375.73871, "r": 232.30058, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 382.13284, "r_x1": 232.30058, "r_y1": 382.13284, "r_x2": 232.30058, "r_y2": 375.73871, "r_x3": 216.76038, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 249.73447999999996, "t": 375.73871, "r": 265.27469, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 382.13284, "r_x1": 265.27469, "r_y1": 382.13284, "r_x2": 265.27469, "r_y2": 375.73871, "r_x3": 249.73447999999996, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 282.70862, "t": 375.73871, "r": 298.24881, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 382.13284, "r_x1": 298.24881, "r_y1": 382.13284, "r_x2": 298.24881, "r_y2": 375.73871, "r_x3": 282.70862, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 395.06137, "t": 411.33353, "r": 401.62366, "b": 419.85904, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06137, "r_y0": 419.85904, "r_x1": 401.62366, "r_y1": 419.85904, "r_x2": 401.62366, "r_y2": 411.33353, "r_x3": 395.06137, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 407.42249, "t": 411.33353, "r": 412.47598, "b": 419.85904, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42249, "r_y0": 419.85904, "r_x1": 412.47598, "r_y1": 419.85904, "r_x2": 412.47598, "r_y2": 411.33353, "r_x3": 407.42249, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 418.69287, "t": 411.33353, "r": 425.25516, "b": 419.85904, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69287, "r_y0": 419.85904, "r_x1": 425.25516, "r_y1": 419.85904, "r_x2": 425.25516, "r_y2": 411.33353, "r_x3": 418.69287, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 430.5086099999999, "t": 411.33353, "r": 436.5709800000001, "b": 419.85904, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5086099999999, "r_y0": 419.85904, "r_x1": 436.5709800000001, "r_y1": 419.85904, "r_x2": 436.5709800000001, "r_y2": 411.33353, "r_x3": 430.5086099999999, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 152.36208, "t": 409.77362, "r": 175.10626, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36208, "r_y0": 416.16776, "r_x1": 175.10626, "r_y1": 416.16776, "r_x2": 175.10626, "r_y2": 409.77362, "r_x3": 152.36208, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 178.89366, "t": 409.77362, "r": 191.01935, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89366, "r_y0": 416.16776, "r_x1": 191.01935, "r_y1": 416.16776, "r_x2": 191.01935, "r_y2": 409.77362, "r_x3": 178.89366, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 194.80676, "t": 409.77362, "r": 208.82614, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.80676, "r_y0": 416.16776, "r_x1": 208.82614, "r_y1": 416.16776, "r_x2": 208.82614, "r_y2": 409.77362, "r_x3": 194.80676, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 212.61354, "t": 409.77362, "r": 226.26003999999998, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61354, "r_y0": 416.16776, "r_x1": 226.26003999999998, "r_y1": 416.16776, "r_x2": 226.26003999999998, "r_y2": 409.77362, "r_x3": 212.61354, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 249.37506000000002, "t": 409.77362, "r": 259.03918, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.37506000000002, "r_y0": 416.16776, "r_x1": 259.03918, "r_y1": 416.16776, "r_x2": 259.03918, "r_y2": 409.77362, "r_x3": 249.37506000000002, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 244.46358, "t": 418.10522, "r": 269.10144, "b": 424.49936, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46358, "r_y0": 424.49936, "r_x1": 269.10144, "r_y1": 424.49936, "r_x2": 269.10144, "r_y2": 418.10522, "r_x3": 244.46358, "r_y3": 418.10522, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 230.04745000000003, "t": 409.77362, "r": 245.58765000000002, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.04745000000003, "r_y0": 416.16776, "r_x1": 245.58765000000002, "r_y1": 416.16776, "r_x2": 245.58765000000002, "r_y2": 409.77362, "r_x3": 230.04745000000003, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 154.50595, "t": 258.60095, "r": 159.62473, "b": 265.70556999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50595, "r_y0": 265.70556999999997, "r_x1": 159.62473, "r_y1": 265.70556999999997, "r_x2": 159.62473, "r_y2": 258.60095, "r_x3": 154.50595, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 164.74348, "t": 258.60095, "r": 185.21857, "b": 265.70556999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74348, "r_y0": 265.70556999999997, "r_x1": 185.21857, "r_y1": 265.70556999999997, "r_x2": 185.21857, "r_y2": 258.60095, "r_x3": 164.74348, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 164.3548, "t": 266.49707, "r": 222.05352999999997, "b": 273.60168, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.3548, "r_y0": 273.60168, "r_x1": 222.05352999999997, "r_y1": 273.60168, "r_x2": 222.05352999999997, "r_y2": 266.49707, "r_x3": 164.3548, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 224.15326, "t": 266.49707, "r": 232.57729, "b": 273.60168, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15326, "r_y0": 273.60168, "r_x1": 232.57729, "r_y1": 273.60168, "r_x2": 232.57729, "r_y2": 266.49707, "r_x3": 224.15326, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 2, "label": "text", "bbox": { "l": 134.765, "t": 452.31378, "r": 480.59232000000003, "b": 520.88669, "coord_origin": "TOPLEFT" }, "confidence": 0.950499951839447, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 461.11075, "r_x1": 161.32928, "r_y1": 461.11075, "r_x2": 161.32928, "r_y2": 452.31378, "r_x3": 134.765, "r_y3": 452.31378, "coord_origin": "TOPLEFT" }, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.269, "r_y0": 461.11075, "r_x1": 226.28617999999997, "r_y1": 461.11075, "r_x2": 226.28617999999997, "r_y2": 452.31378, "r_x3": 164.269, "r_y3": 452.31378, "coord_origin": "TOPLEFT" }, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.992, "r_y0": 461.11075, "r_x1": 480.59232000000003, "r_y1": 461.11075, "r_x2": 480.59232000000003, "r_y2": 452.31378, "r_x3": 229.992, "r_y3": 452.31378, "coord_origin": "TOPLEFT" }, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 473.06573, "r_x1": 480.59180000000003, "r_y1": 473.06573, "r_x2": 480.59180000000003, "r_y2": 464.26877, "r_x3": 134.76501, "r_y3": 464.26877, "coord_origin": "TOPLEFT" }, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 485.02072, "r_x1": 480.58673, "r_y1": 485.02072, "r_x2": 480.58673, "r_y2": 476.22375, "r_x3": 134.76501, "r_y3": 476.22375, "coord_origin": "TOPLEFT" }, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 496.97672, "r_x1": 480.58658, "r_y1": 496.97672, "r_x2": 480.58658, "r_y2": 488.17975, "r_x3": 134.76501, "r_y3": 488.17975, "coord_origin": "TOPLEFT" }, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 508.9317, "r_x1": 480.58978, "r_y1": 508.9317, "r_x2": 480.58978, "r_y2": 500.13474, "r_x3": 134.76501, "r_y3": 500.13474, "coord_origin": "TOPLEFT" }, "text": "area of research, in which many novel machine learning algorithms are being", "orig": "area of research, in which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 520.88669, "r_x1": 313.24597, "r_y1": 520.88669, "r_x2": 313.24597, "r_y2": 512.0897199999999, "r_x3": 134.76501, "r_y3": 512.0897199999999, "coord_origin": "TOPLEFT" }, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.76501, "t": 524.55072, "r": 480.59482, "b": 664.8547, "coord_origin": "TOPLEFT" }, "confidence": 0.9845512509346008, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70901, "r_y0": 533.3476900000001, "r_x1": 480.58884000000006, "r_y1": 533.3476900000001, "r_x2": 480.58884000000006, "r_y2": 524.55072, "r_x3": 149.70901, "r_y3": 524.55072, "coord_origin": "TOPLEFT" }, "text": "Recently emerging SOTA methods for table structure recognition employ", "orig": "Recently emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 545.30368, "r_x1": 480.5917400000001, "r_y1": 545.30368, "r_x2": 480.5917400000001, "r_y2": 536.50671, "r_x3": 134.76501, "r_y3": 536.50671, "coord_origin": "TOPLEFT" }, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 557.25868, "r_x1": 480.58868, "r_y1": 557.25868, "r_x2": 480.58868, "r_y2": 548.46172, "r_x3": 134.76501, "r_y3": 548.46172, "coord_origin": "TOPLEFT" }, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 569.2136800000001, "r_x1": 480.58795, "r_y1": 569.2136800000001, "r_x2": 480.58795, "r_y2": 560.41672, "r_x3": 134.76501, "r_y3": 560.41672, "coord_origin": "TOPLEFT" }, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 581.16869, "r_x1": 480.58978, "r_y1": 581.16869, "r_x2": 480.58978, "r_y2": 572.37172, "r_x3": 134.76501, "r_y3": 572.37172, "coord_origin": "TOPLEFT" }, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 593.12369, "r_x1": 480.59479, "r_y1": 593.12369, "r_x2": 480.59479, "r_y2": 584.32672, "r_x3": 134.76501, "r_y3": 584.32672, "coord_origin": "TOPLEFT" }, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 605.0796799999999, "r_x1": 480.58678999999995, "r_y1": 605.0796799999999, "r_x2": 480.58678999999995, "r_y2": 596.28271, "r_x3": 134.76501, "r_y3": 596.28271, "coord_origin": "TOPLEFT" }, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 617.03468, "r_x1": 480.59476, "r_y1": 617.03468, "r_x2": 480.59476, "r_y2": 608.23772, "r_x3": 134.76501, "r_y3": 608.23772, "coord_origin": "TOPLEFT" }, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 628.98969, "r_x1": 480.5938100000001, "r_y1": 628.98969, "r_x2": 480.5938100000001, "r_y2": 620.19272, "r_x3": 134.76501, "r_y3": 620.19272, "coord_origin": "TOPLEFT" }, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 640.94469, "r_x1": 480.59482, "r_y1": 640.94469, "r_x2": 480.59482, "r_y2": 632.1477199999999, "r_x3": 134.76501, "r_y3": 632.1477199999999, "coord_origin": "TOPLEFT" }, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 652.89969, "r_x1": 480.58771, "r_y1": 652.89969, "r_x2": 480.58771, "r_y2": 644.10272, "r_x3": 134.76501, "r_y3": 644.10272, "coord_origin": "TOPLEFT" }, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 664.8547, "r_x1": 421.45377, "r_y1": 664.8547, "r_x2": 421.45377, "r_y2": 656.05772, "r_x3": 134.76501, "r_y3": 656.05772, "coord_origin": "TOPLEFT" }, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 5, "page_no": 1, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 139.37193, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8580349683761597, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2" }, { "label": "page_header", "id": 3, "page_no": 1, "cluster": { "id": 3, "label": "page_header", "bbox": { "l": 167.81335, "t": 93.77099999999996, "r": 231.72227, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9076642990112305, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "caption", "id": 4, "page_no": 1, "cluster": { "id": 4, "label": "caption", "bbox": { "l": 134.765, "t": 126.33416999999997, "r": 480.59189, "b": 200.22058000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.8939083218574524, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 134.26049999999998, "r_x1": 162.64424, "r_y1": 134.26049999999998, "r_x2": 162.64424, "r_y2": 126.33416999999997, "r_x3": 134.765, "r_y3": 126.33416999999997, "coord_origin": "TOPLEFT" }, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.062, "r_y0": 134.46667000000002, "r_x1": 480.59106, "r_y1": 134.46667000000002, "r_x2": 480.59106, "r_y2": 126.39697000000001, "r_x3": 167.062, "r_y3": 126.39697000000001, "coord_origin": "TOPLEFT" }, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 145.42566, "r_x1": 480.59018, "r_y1": 145.42566, "r_x2": 480.59018, "r_y2": 137.35595999999998, "r_x3": 134.765, "r_y3": 137.35595999999998, "coord_origin": "TOPLEFT" }, "text": "table-example with complex row and column headers, including a 2D empty span,", "orig": "table-example with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 156.38464, "r_x1": 147.95433, "r_y1": 156.38464, "r_x2": 147.95433, "r_y2": 148.31493999999998, "r_x3": 134.765, "r_y3": 148.31493999999998, "coord_origin": "TOPLEFT" }, "text": "(B)", "orig": "(B)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.39224, "r_y0": 156.38464, "r_x1": 480.59096999999997, "r_y1": 156.38464, "r_x2": 480.59096999999997, "r_y2": 148.31493999999998, "r_x3": 152.39224, "r_y3": 148.31493999999998, "coord_origin": "TOPLEFT" }, "text": "minimal graphical representation of table structure using rectangular layout, (C)", "orig": "minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 167.34362999999996, "r_x1": 480.59189, "r_y1": 167.34362999999996, "r_x2": 480.59189, "r_y2": 159.27392999999995, "r_x3": 134.765, "r_y3": 159.27392999999995, "coord_origin": "TOPLEFT" }, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 178.30260999999996, "r_x1": 480.58914000000004, "r_y1": 178.30260999999996, "r_x2": 480.58914000000004, "r_y2": 170.23290999999995, "r_x3": 134.765, "r_y3": 170.23290999999995, "coord_origin": "TOPLEFT" }, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 189.26160000000004, "r_x1": 480.59020999999996, "r_y1": 189.26160000000004, "r_x2": 480.59020999999996, "r_y2": 181.19188999999994, "r_x3": 134.765, "r_y3": 181.19188999999994, "coord_origin": "TOPLEFT" }, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 200.22058000000004, "r_x1": 460.87109, "r_y1": 200.22058000000004, "r_x2": 460.87109, "r_y2": 192.15088000000003, "r_x3": 134.765, "r_y3": 192.15088000000003, "coord_origin": "TOPLEFT" }, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 1. Comparison between HTML and OTSL table structure representation: (A) table-example with complex row and column headers, including a 2D empty span, (B) minimal graphical representation of table structure using rectangular layout, (C) HTML representation, (D) OTSL representation. This example demonstrates many of the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case), its reduced sequence length (55 versus 30) and a enhanced internal structure (variable token sequence length per row in HTML versus a fixed length of rows in OTSL)." }, { "label": "picture", "id": 1, "page_no": 1, "cluster": { "id": 1, "label": "picture", "bbox": { "l": 148.45364379882812, "t": 208.37423706054688, "r": 464.3608093261719, "b": 425.8462219238281, "coord_origin": "TOPLEFT" }, "confidence": 0.9688959121704102, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41107, "r_y0": 289.50903, "r_x1": 402.97336, "r_y1": 289.50903, "r_x2": 402.97336, "r_y2": 280.98352, "r_x3": 396.41107, "r_y3": 280.98352, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.58682, "r_y0": 289.42343, "r_x1": 425.14911, "r_y1": 289.42343, "r_x2": 425.14911, "r_y2": 280.89792, "r_x3": 418.58682, "r_y3": 280.89792, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.74835, "r_y0": 311.76279, "r_x1": 402.31064, "r_y1": 311.76279, "r_x2": 402.31064, "r_y2": 303.23727, "r_x3": 395.74835, "r_y3": 303.23727, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54214, "r_y0": 311.89532, "r_x1": 414.10443, "r_y1": 311.89532, "r_x2": 414.10443, "r_y2": 303.36981, "r_x3": 407.54214, "r_y3": 303.36981, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56335, "r_y0": 322.9317, "r_x1": 414.12564, "r_y1": 322.9317, "r_x2": 414.12564, "r_y2": 314.40619, "r_x3": 407.56335, "r_y3": 314.40619, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51108, "r_y0": 300.61053000000004, "r_x1": 425.07336, "r_y1": 300.61053000000004, "r_x2": 425.07336, "r_y2": 292.08502000000004, "r_x3": 418.51108, "r_y3": 292.08502000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.59744, "r_y0": 300.61658, "r_x1": 436.1597300000001, "r_y1": 300.61658, "r_x2": 436.1597300000001, "r_y2": 292.09106, "r_x3": 429.59744, "r_y3": 292.09106, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.68759000000006, "r_y0": 300.53781000000004, "r_x1": 447.24987999999996, "r_y1": 300.53781000000004, "r_x2": 447.24987999999996, "r_y2": 292.01230000000004, "r_x3": 440.68759000000006, "r_y3": 292.01230000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6232, "r_y0": 311.82034, "r_x1": 425.18549, "r_y1": 311.82034, "r_x2": 425.18549, "r_y2": 303.29483, "r_x3": 418.6232, "r_y3": 303.29483, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7095299999999, "r_y0": 311.82562, "r_x1": 436.27182, "r_y1": 311.82562, "r_x2": 436.27182, "r_y2": 303.30011, "r_x3": 429.7095299999999, "r_y3": 303.30011, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7996800000001, "r_y0": 311.74762, "r_x1": 447.36197, "r_y1": 311.74762, "r_x2": 447.36197, "r_y2": 303.22211, "r_x3": 440.7996800000001, "r_y3": 303.22211, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62546, "r_y0": 323.09454, "r_x1": 425.18774, "r_y1": 323.09454, "r_x2": 425.18774, "r_y2": 314.56903, "r_x3": 418.62546, "r_y3": 314.56903, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71181999999993, "r_y0": 323.09985, "r_x1": 436.27411, "r_y1": 323.09985, "r_x2": 436.27411, "r_y2": 314.57434, "r_x3": 429.71181999999993, "r_y3": 314.57434, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.80194, "r_y0": 323.02182, "r_x1": 447.36423, "r_y1": 323.02182, "r_x2": 447.36423, "r_y2": 314.49631, "r_x3": 440.80194, "r_y3": 314.49631, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.39746, "r_y0": 333.81583, "r_x1": 413.95975, "r_y1": 333.81583, "r_x2": 413.95975, "r_y2": 325.29031, "r_x3": 407.39746, "r_y3": 325.29031, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.45959, "r_y0": 333.97867, "r_x1": 425.02188, "r_y1": 333.97867, "r_x2": 425.02188, "r_y2": 325.45316, "r_x3": 418.45959, "r_y3": 325.45316, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.54593, "r_y0": 333.98471, "r_x1": 436.10822, "r_y1": 333.98471, "r_x2": 436.10822, "r_y2": 325.4592, "r_x3": 429.54593, "r_y3": 325.4592, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.63608, "r_y0": 333.90594, "r_x1": 447.19836, "r_y1": 333.90594, "r_x2": 447.19836, "r_y2": 325.38043, "r_x3": 440.63608, "r_y3": 325.38043, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.89511000000005, "r_y0": 288.68268, "r_x1": 463.51273000000003, "r_y1": 288.68268, "r_x2": 463.51273000000003, "r_y2": 280.15717, "r_x3": 451.89511000000005, "r_y3": 280.15717, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1557, "r_y0": 300.12427, "r_x1": 463.77332, "r_y1": 300.12427, "r_x2": 463.77332, "r_y2": 291.59875000000005, "r_x3": 452.1557, "r_y3": 291.59875000000005, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.17688000000004, "r_y0": 311.36816, "r_x1": 463.79449000000005, "r_y1": 311.36816, "r_x2": 463.79449000000005, "r_y2": 302.84265, "r_x3": 452.17688000000004, "r_y3": 302.84265, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.09887999999995, "r_y0": 322.6499299999999, "r_x1": 463.71648999999996, "r_y1": 322.6499299999999, "r_x2": 463.71648999999996, "r_y2": 314.12441999999993, "r_x3": 452.09887999999995, "r_y3": 314.12441999999993, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.29733, "r_y0": 333.99457, "r_x1": 463.91495, "r_y1": 333.99457, "r_x2": 463.91495, "r_y2": 325.46906, "r_x3": 452.29733, "r_y3": 325.46906, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.09677, "r_y0": 323.02029000000005, "r_x1": 402.65906, "r_y1": 323.02029000000005, "r_x2": 402.65906, "r_y2": 314.49478, "r_x3": 396.09677, "r_y3": 314.49478, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.99829, "r_y0": 333.91428, "r_x1": 402.56058, "r_y1": 333.91428, "r_x2": 402.56058, "r_y2": 325.38876000000005, "r_x3": 395.99829, "r_y3": 325.38876000000005, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27475, "r_y0": 300.79608, "r_x1": 402.83704, "r_y1": 300.79608, "r_x2": 402.83704, "r_y2": 292.27057, "r_x3": 396.27475, "r_y3": 292.27057, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.54724, "r_y0": 289.49463, "r_x1": 413.60074, "r_y1": 289.49463, "r_x2": 413.60074, "r_y2": 280.96912, "r_x3": 408.54724, "r_y3": 280.96912, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.58966, "r_y0": 289.02277, "r_x1": 435.6431600000001, "r_y1": 289.02277, "r_x2": 435.6431600000001, "r_y2": 280.49725, "r_x3": 430.58966, "r_y3": 280.49725, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08069, "r_y0": 288.90613, "r_x1": 446.13419, "r_y1": 288.90613, "r_x2": 446.13419, "r_y2": 280.38062, "r_x3": 441.08069, "r_y3": 280.38062, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97388, "r_y0": 300.65976, "r_x1": 414.03625, "r_y1": 300.65976, "r_x2": 414.03625, "r_y2": 292.13425, "r_x3": 407.97388, "r_y3": 292.13425, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.25640999999996, "r_y0": 419.7062700000001, "r_x1": 452.87402, "r_y1": 419.7062700000001, "r_x2": 452.87402, "r_y2": 411.1807600000001, "r_x3": 441.25640999999996, "r_y3": 411.1807600000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 406.89935, "r_x1": 432.48929, "r_y1": 406.89935, "r_x2": 432.48929, "r_y2": 399.7947700000001, "r_x3": 393.75256, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.5896000000001, "r_y0": 406.89935, "r_x1": 438.80083999999994, "r_y1": 406.89935, "r_x2": 438.80083999999994, "r_y2": 399.7947700000001, "r_x3": 434.5896000000001, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.90573, "r_y0": 406.89935, "r_x1": 463.22235, "r_y1": 406.89935, "r_x2": 463.22235, "r_y2": 399.7947700000001, "r_x3": 440.90573, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.11816, "r_y0": 265.65179, "r_x1": 413.99307, "r_y1": 265.65179, "r_x2": 413.99307, "r_y2": 258.54718, "r_x3": 384.11816, "r_y3": 258.54718, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 273.77966000000004, "r_x1": 451.45129000000003, "r_y1": 273.77966000000004, "r_x2": 451.45129000000003, "r_y2": 266.67505000000006, "r_x3": 393.75256, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55083999999994, "r_y0": 273.77966000000004, "r_x1": 461.97485, "r_y1": 273.77966000000004, "r_x2": 461.97485, "r_y2": 266.67505000000006, "r_x3": 453.55083999999994, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79318, "r_y0": 406.86474999999996, "r_x1": 233.89371000000003, "r_y1": 406.86474999999996, "r_x2": 233.89371000000003, "r_y2": 399.76016, "r_x3": 151.79318, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99332, "r_y0": 406.86474999999996, "r_x1": 244.41734000000002, "r_y1": 406.86474999999996, "r_x2": 244.41734000000002, "r_y2": 399.76016, "r_x3": 235.99332, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52222, "r_y0": 406.86474999999996, "r_x1": 268.83884, "r_y1": 406.86474999999996, "r_x2": 268.83884, "r_y2": 399.76016, "r_x3": 246.52222, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3298, "r_y0": 220.67920000000004, "r_x1": 159.79837, "r_y1": 220.67920000000004, "r_x2": 159.79837, "r_y2": 213.57457999999997, "r_x3": 154.3298, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07053, "r_y0": 220.67920000000004, "r_x1": 326.53909, "r_y1": 220.67920000000004, "r_x2": 326.53909, "r_y2": 213.57457999999997, "r_x3": 321.07053, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 286.69824, "r_x1": 175.83888, "r_y1": 286.69824, "r_x2": 175.83888, "r_y2": 280.30411, "r_x3": 153.0947, "r_y3": 280.30411, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 293.51501, "r_x1": 172.79608, "r_y1": 293.51501, "r_x2": 172.79608, "r_y2": 287.12088, "r_x3": 160.67039, "r_y3": 287.12088, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 300.33179, "r_x1": 177.91019, "r_y1": 300.33179, "r_x2": 177.91019, "r_y2": 293.93765, "r_x3": 168.24603, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.35785, "r_y0": 300.33179, "r_x1": 278.89804, "r_y1": 300.33179, "r_x2": 278.89804, "r_y2": 293.93765, "r_x3": 263.35785, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79175, "r_y0": 300.33179, "r_x1": 290.4559, "r_y1": 300.33179, "r_x2": 290.4559, "r_y2": 293.93765, "r_x3": 280.79175, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.92926, "r_y0": 300.33179, "r_x1": 351.46945, "r_y1": 300.33179, "r_x2": 351.46945, "r_y2": 293.93765, "r_x3": 335.92926, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 307.14856, "r_x1": 174.68979, "r_y1": 307.14856, "r_x2": 174.68979, "r_y2": 300.75442999999996, "r_x3": 160.67039, "r_y3": 300.75442999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 313.96536, "r_x1": 172.79608, "r_y1": 313.96536, "r_x2": 172.79608, "r_y2": 307.57122999999996, "r_x3": 160.67039, "r_y3": 307.57122999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 320.78214, "r_x1": 181.89255, "r_y1": 320.78214, "r_x2": 181.89255, "r_y2": 314.388, "r_x3": 168.24603, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 320.78214, "r_x1": 214.86666999999997, "r_y1": 320.78214, "r_x2": 214.86666999999997, "r_y2": 314.388, "r_x3": 201.22015, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 320.78214, "r_x1": 247.84079000000003, "r_y1": 320.78214, "r_x2": 247.84079000000003, "r_y2": 314.388, "r_x3": 234.19427000000002, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 327.59890999999993, "r_x1": 174.68979, "r_y1": 327.59890999999993, "r_x2": 174.68979, "r_y2": 321.20477, "r_x3": 160.67039, "r_y3": 321.20477, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 334.41571000000005, "r_x1": 172.79608, "r_y1": 334.41571000000005, "r_x2": 172.79608, "r_y2": 328.02158, "r_x3": 160.67039, "r_y3": 328.02158, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 341.23248, "r_x1": 373.09091, "r_y1": 341.23248, "r_x2": 373.09091, "r_y2": 334.83835, "r_x3": 168.24603, "r_y3": 334.83835, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 348.04926, "r_x1": 174.68979, "r_y1": 348.04926, "r_x2": 174.68979, "r_y2": 341.65512, "r_x3": 160.67039, "r_y3": 341.65512, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 354.86572, "r_x1": 172.79608, "r_y1": 354.86572, "r_x2": 172.79608, "r_y2": 348.47159, "r_x3": 160.67039, "r_y3": 348.47159, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 361.68249999999995, "r_x1": 181.89255, "r_y1": 361.68249999999995, "r_x2": 181.89255, "r_y2": 355.28836000000007, "r_x3": 168.24603, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 361.68249999999995, "r_x1": 214.86666999999997, "r_y1": 361.68249999999995, "r_x2": 214.86666999999997, "r_y2": 355.28836000000007, "r_x3": 201.22015, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 361.68249999999995, "r_x1": 247.84079000000003, "r_y1": 361.68249999999995, "r_x2": 247.84079000000003, "r_y2": 355.28836000000007, "r_x3": 234.19427000000002, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 361.68249999999995, "r_x1": 280.81488, "r_y1": 361.68249999999995, "r_x2": 280.81488, "r_y2": 355.28836000000007, "r_x3": 267.1684, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 368.49929999999995, "r_x1": 174.68979, "r_y1": 368.49929999999995, "r_x2": 174.68979, "r_y2": 362.10516000000007, "r_x3": 160.67039, "r_y3": 362.10516000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 375.31607, "r_x1": 172.79608, "r_y1": 375.31607, "r_x2": 172.79608, "r_y2": 368.92194, "r_x3": 160.67039, "r_y3": 368.92194, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 382.13284, "r_x1": 181.89255, "r_y1": 382.13284, "r_x2": 181.89255, "r_y2": 375.73871, "r_x3": 168.24603, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 382.13284, "r_x1": 214.86666999999997, "r_y1": 382.13284, "r_x2": 214.86666999999997, "r_y2": 375.73871, "r_x3": 201.22015, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 382.13284, "r_x1": 247.84079000000003, "r_y1": 382.13284, "r_x2": 247.84079000000003, "r_y2": 375.73871, "r_x3": 234.19427000000002, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 382.13284, "r_x1": 280.81488, "r_y1": 382.13284, "r_x2": 280.81488, "r_y2": 375.73871, "r_x3": 267.1684, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 388.94965, "r_x1": 174.68979, "r_y1": 388.94965, "r_x2": 174.68979, "r_y2": 382.55551, "r_x3": 160.67039, "r_y3": 382.55551, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 395.76642, "r_x1": 177.73259, "r_y1": 395.76642, "r_x2": 177.73259, "r_y2": 389.37228, "r_x3": 153.0947, "r_y3": 389.37228, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 320.78214, "r_x1": 199.32646, "r_y1": 320.78214, "r_x2": 199.32646, "r_y2": 314.388, "r_x3": 183.78624, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 320.78214, "r_x1": 232.30058, "r_y1": 320.78214, "r_x2": 232.30058, "r_y2": 314.388, "r_x3": 216.76038, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 320.78214, "r_x1": 265.27469, "r_y1": 320.78214, "r_x2": 265.27469, "r_y2": 314.388, "r_x3": 249.73447999999996, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 361.68249999999995, "r_x1": 199.32646, "r_y1": 361.68249999999995, "r_x2": 199.32646, "r_y2": 355.28836000000007, "r_x3": 183.78624, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 361.68249999999995, "r_x1": 232.30058, "r_y1": 361.68249999999995, "r_x2": 232.30058, "r_y2": 355.28836000000007, "r_x3": 216.76038, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 361.68249999999995, "r_x1": 265.27469, "r_y1": 361.68249999999995, "r_x2": 265.27469, "r_y2": 355.28836000000007, "r_x3": 249.73447999999996, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 361.68249999999995, "r_x1": 298.24881, "r_y1": 361.68249999999995, "r_x2": 298.24881, "r_y2": 355.28836000000007, "r_x3": 282.70862, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 382.13284, "r_x1": 199.32646, "r_y1": 382.13284, "r_x2": 199.32646, "r_y2": 375.73871, "r_x3": 183.78624, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 382.13284, "r_x1": 232.30058, "r_y1": 382.13284, "r_x2": 232.30058, "r_y2": 375.73871, "r_x3": 216.76038, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 382.13284, "r_x1": 265.27469, "r_y1": 382.13284, "r_x2": 265.27469, "r_y2": 375.73871, "r_x3": 249.73447999999996, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 382.13284, "r_x1": 298.24881, "r_y1": 382.13284, "r_x2": 298.24881, "r_y2": 375.73871, "r_x3": 282.70862, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06137, "r_y0": 419.85904, "r_x1": 401.62366, "r_y1": 419.85904, "r_x2": 401.62366, "r_y2": 411.33353, "r_x3": 395.06137, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42249, "r_y0": 419.85904, "r_x1": 412.47598, "r_y1": 419.85904, "r_x2": 412.47598, "r_y2": 411.33353, "r_x3": 407.42249, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69287, "r_y0": 419.85904, "r_x1": 425.25516, "r_y1": 419.85904, "r_x2": 425.25516, "r_y2": 411.33353, "r_x3": 418.69287, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5086099999999, "r_y0": 419.85904, "r_x1": 436.5709800000001, "r_y1": 419.85904, "r_x2": 436.5709800000001, "r_y2": 411.33353, "r_x3": 430.5086099999999, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36208, "r_y0": 416.16776, "r_x1": 175.10626, "r_y1": 416.16776, "r_x2": 175.10626, "r_y2": 409.77362, "r_x3": 152.36208, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89366, "r_y0": 416.16776, "r_x1": 191.01935, "r_y1": 416.16776, "r_x2": 191.01935, "r_y2": 409.77362, "r_x3": 178.89366, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.80676, "r_y0": 416.16776, "r_x1": 208.82614, "r_y1": 416.16776, "r_x2": 208.82614, "r_y2": 409.77362, "r_x3": 194.80676, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61354, "r_y0": 416.16776, "r_x1": 226.26003999999998, "r_y1": 416.16776, "r_x2": 226.26003999999998, "r_y2": 409.77362, "r_x3": 212.61354, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.37506000000002, "r_y0": 416.16776, "r_x1": 259.03918, "r_y1": 416.16776, "r_x2": 259.03918, "r_y2": 409.77362, "r_x3": 249.37506000000002, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46358, "r_y0": 424.49936, "r_x1": 269.10144, "r_y1": 424.49936, "r_x2": 269.10144, "r_y2": 418.10522, "r_x3": 244.46358, "r_y3": 418.10522, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.04745000000003, "r_y0": 416.16776, "r_x1": 245.58765000000002, "r_y1": 416.16776, "r_x2": 245.58765000000002, "r_y2": 409.77362, "r_x3": 230.04745000000003, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50595, "r_y0": 265.70556999999997, "r_x1": 159.62473, "r_y1": 265.70556999999997, "r_x2": 159.62473, "r_y2": 258.60095, "r_x3": 154.50595, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74348, "r_y0": 265.70556999999997, "r_x1": 185.21857, "r_y1": 265.70556999999997, "r_x2": 185.21857, "r_y2": 258.60095, "r_x3": 164.74348, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.3548, "r_y0": 273.60168, "r_x1": 222.05352999999997, "r_y1": 273.60168, "r_x2": 222.05352999999997, "r_y2": 266.49707, "r_x3": 164.3548, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15326, "r_y0": 273.60168, "r_x1": 232.57729, "r_y1": 273.60168, "r_x2": 232.57729, "r_y2": 266.49707, "r_x3": 224.15326, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 396.41107, "t": 280.98352, "r": 402.97336, "b": 289.50903, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41107, "r_y0": 289.50903, "r_x1": 402.97336, "r_y1": 289.50903, "r_x2": 402.97336, "r_y2": 280.98352, "r_x3": 396.41107, "r_y3": 280.98352, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 418.58682, "t": 280.89792, "r": 425.14911, "b": 289.42343, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.58682, "r_y0": 289.42343, "r_x1": 425.14911, "r_y1": 289.42343, "r_x2": 425.14911, "r_y2": 280.89792, "r_x3": 418.58682, "r_y3": 280.89792, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 395.74835, "t": 303.23727, "r": 402.31064, "b": 311.76279, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.74835, "r_y0": 311.76279, "r_x1": 402.31064, "r_y1": 311.76279, "r_x2": 402.31064, "r_y2": 303.23727, "r_x3": 395.74835, "r_y3": 303.23727, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 407.54214, "t": 303.36981, "r": 414.10443, "b": 311.89532, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54214, "r_y0": 311.89532, "r_x1": 414.10443, "r_y1": 311.89532, "r_x2": 414.10443, "r_y2": 303.36981, "r_x3": 407.54214, "r_y3": 303.36981, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 407.56335, "t": 314.40619, "r": 414.12564, "b": 322.9317, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56335, "r_y0": 322.9317, "r_x1": 414.12564, "r_y1": 322.9317, "r_x2": 414.12564, "r_y2": 314.40619, "r_x3": 407.56335, "r_y3": 314.40619, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 418.51108, "t": 292.08502000000004, "r": 425.07336, "b": 300.61053000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51108, "r_y0": 300.61053000000004, "r_x1": 425.07336, "r_y1": 300.61053000000004, "r_x2": 425.07336, "r_y2": 292.08502000000004, "r_x3": 418.51108, "r_y3": 292.08502000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 429.59744, "t": 292.09106, "r": 436.1597300000001, "b": 300.61658, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.59744, "r_y0": 300.61658, "r_x1": 436.1597300000001, "r_y1": 300.61658, "r_x2": 436.1597300000001, "r_y2": 292.09106, "r_x3": 429.59744, "r_y3": 292.09106, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 440.68759000000006, "t": 292.01230000000004, "r": 447.24987999999996, "b": 300.53781000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.68759000000006, "r_y0": 300.53781000000004, "r_x1": 447.24987999999996, "r_y1": 300.53781000000004, "r_x2": 447.24987999999996, "r_y2": 292.01230000000004, "r_x3": 440.68759000000006, "r_y3": 292.01230000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 418.6232, "t": 303.29483, "r": 425.18549, "b": 311.82034, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6232, "r_y0": 311.82034, "r_x1": 425.18549, "r_y1": 311.82034, "r_x2": 425.18549, "r_y2": 303.29483, "r_x3": 418.6232, "r_y3": 303.29483, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 429.7095299999999, "t": 303.30011, "r": 436.27182, "b": 311.82562, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7095299999999, "r_y0": 311.82562, "r_x1": 436.27182, "r_y1": 311.82562, "r_x2": 436.27182, "r_y2": 303.30011, "r_x3": 429.7095299999999, "r_y3": 303.30011, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 440.7996800000001, "t": 303.22211, "r": 447.36197, "b": 311.74762, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7996800000001, "r_y0": 311.74762, "r_x1": 447.36197, "r_y1": 311.74762, "r_x2": 447.36197, "r_y2": 303.22211, "r_x3": 440.7996800000001, "r_y3": 303.22211, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 418.62546, "t": 314.56903, "r": 425.18774, "b": 323.09454, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62546, "r_y0": 323.09454, "r_x1": 425.18774, "r_y1": 323.09454, "r_x2": 425.18774, "r_y2": 314.56903, "r_x3": 418.62546, "r_y3": 314.56903, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 429.71181999999993, "t": 314.57434, "r": 436.27411, "b": 323.09985, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71181999999993, "r_y0": 323.09985, "r_x1": 436.27411, "r_y1": 323.09985, "r_x2": 436.27411, "r_y2": 314.57434, "r_x3": 429.71181999999993, "r_y3": 314.57434, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 440.80194, "t": 314.49631, "r": 447.36423, "b": 323.02182, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.80194, "r_y0": 323.02182, "r_x1": 447.36423, "r_y1": 323.02182, "r_x2": 447.36423, "r_y2": 314.49631, "r_x3": 440.80194, "r_y3": 314.49631, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 407.39746, "t": 325.29031, "r": 413.95975, "b": 333.81583, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.39746, "r_y0": 333.81583, "r_x1": 413.95975, "r_y1": 333.81583, "r_x2": 413.95975, "r_y2": 325.29031, "r_x3": 407.39746, "r_y3": 325.29031, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 418.45959, "t": 325.45316, "r": 425.02188, "b": 333.97867, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.45959, "r_y0": 333.97867, "r_x1": 425.02188, "r_y1": 333.97867, "r_x2": 425.02188, "r_y2": 325.45316, "r_x3": 418.45959, "r_y3": 325.45316, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 429.54593, "t": 325.4592, "r": 436.10822, "b": 333.98471, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.54593, "r_y0": 333.98471, "r_x1": 436.10822, "r_y1": 333.98471, "r_x2": 436.10822, "r_y2": 325.4592, "r_x3": 429.54593, "r_y3": 325.4592, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 440.63608, "t": 325.38043, "r": 447.19836, "b": 333.90594, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.63608, "r_y0": 333.90594, "r_x1": 447.19836, "r_y1": 333.90594, "r_x2": 447.19836, "r_y2": 325.38043, "r_x3": 440.63608, "r_y3": 325.38043, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 451.89511000000005, "t": 280.15717, "r": 463.51273000000003, "b": 288.68268, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.89511000000005, "r_y0": 288.68268, "r_x1": 463.51273000000003, "r_y1": 288.68268, "r_x2": 463.51273000000003, "r_y2": 280.15717, "r_x3": 451.89511000000005, "r_y3": 280.15717, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 452.1557, "t": 291.59875000000005, "r": 463.77332, "b": 300.12427, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1557, "r_y0": 300.12427, "r_x1": 463.77332, "r_y1": 300.12427, "r_x2": 463.77332, "r_y2": 291.59875000000005, "r_x3": 452.1557, "r_y3": 291.59875000000005, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 452.17688000000004, "t": 302.84265, "r": 463.79449000000005, "b": 311.36816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.17688000000004, "r_y0": 311.36816, "r_x1": 463.79449000000005, "r_y1": 311.36816, "r_x2": 463.79449000000005, "r_y2": 302.84265, "r_x3": 452.17688000000004, "r_y3": 302.84265, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 452.09887999999995, "t": 314.12441999999993, "r": 463.71648999999996, "b": 322.6499299999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.09887999999995, "r_y0": 322.6499299999999, "r_x1": 463.71648999999996, "r_y1": 322.6499299999999, "r_x2": 463.71648999999996, "r_y2": 314.12441999999993, "r_x3": 452.09887999999995, "r_y3": 314.12441999999993, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 452.29733, "t": 325.46906, "r": 463.91495, "b": 333.99457, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.29733, "r_y0": 333.99457, "r_x1": 463.91495, "r_y1": 333.99457, "r_x2": 463.91495, "r_y2": 325.46906, "r_x3": 452.29733, "r_y3": 325.46906, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 396.09677, "t": 314.49478, "r": 402.65906, "b": 323.02029000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.09677, "r_y0": 323.02029000000005, "r_x1": 402.65906, "r_y1": 323.02029000000005, "r_x2": 402.65906, "r_y2": 314.49478, "r_x3": 396.09677, "r_y3": 314.49478, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 395.99829, "t": 325.38876000000005, "r": 402.56058, "b": 333.91428, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.99829, "r_y0": 333.91428, "r_x1": 402.56058, "r_y1": 333.91428, "r_x2": 402.56058, "r_y2": 325.38876000000005, "r_x3": 395.99829, "r_y3": 325.38876000000005, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.27475, "t": 292.27057, "r": 402.83704, "b": 300.79608, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27475, "r_y0": 300.79608, "r_x1": 402.83704, "r_y1": 300.79608, "r_x2": 402.83704, "r_y2": 292.27057, "r_x3": 396.27475, "r_y3": 292.27057, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 408.54724, "t": 280.96912, "r": 413.60074, "b": 289.49463, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.54724, "r_y0": 289.49463, "r_x1": 413.60074, "r_y1": 289.49463, "r_x2": 413.60074, "r_y2": 280.96912, "r_x3": 408.54724, "r_y3": 280.96912, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 430.58966, "t": 280.49725, "r": 435.6431600000001, "b": 289.02277, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.58966, "r_y0": 289.02277, "r_x1": 435.6431600000001, "r_y1": 289.02277, "r_x2": 435.6431600000001, "r_y2": 280.49725, "r_x3": 430.58966, "r_y3": 280.49725, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 441.08069, "t": 280.38062, "r": 446.13419, "b": 288.90613, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08069, "r_y0": 288.90613, "r_x1": 446.13419, "r_y1": 288.90613, "r_x2": 446.13419, "r_y2": 280.38062, "r_x3": 441.08069, "r_y3": 280.38062, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 407.97388, "t": 292.13425, "r": 414.03625, "b": 300.65976, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97388, "r_y0": 300.65976, "r_x1": 414.03625, "r_y1": 300.65976, "r_x2": 414.03625, "r_y2": 292.13425, "r_x3": 407.97388, "r_y3": 292.13425, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 441.25640999999996, "t": 411.1807600000001, "r": 452.87402, "b": 419.7062700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.25640999999996, "r_y0": 419.7062700000001, "r_x1": 452.87402, "r_y1": 419.7062700000001, "r_x2": 452.87402, "r_y2": 411.1807600000001, "r_x3": 441.25640999999996, "r_y3": 411.1807600000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 393.75256, "t": 399.7947700000001, "r": 432.48929, "b": 406.89935, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 406.89935, "r_x1": 432.48929, "r_y1": 406.89935, "r_x2": 432.48929, "r_y2": 399.7947700000001, "r_x3": 393.75256, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 434.5896000000001, "t": 399.7947700000001, "r": 438.80083999999994, "b": 406.89935, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.5896000000001, "r_y0": 406.89935, "r_x1": 438.80083999999994, "r_y1": 406.89935, "r_x2": 438.80083999999994, "r_y2": 399.7947700000001, "r_x3": 434.5896000000001, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 440.90573, "t": 399.7947700000001, "r": 463.22235, "b": 406.89935, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.90573, "r_y0": 406.89935, "r_x1": 463.22235, "r_y1": 406.89935, "r_x2": 463.22235, "r_y2": 399.7947700000001, "r_x3": 440.90573, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 384.11816, "t": 258.54718, "r": 413.99307, "b": 265.65179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.11816, "r_y0": 265.65179, "r_x1": 413.99307, "r_y1": 265.65179, "r_x2": 413.99307, "r_y2": 258.54718, "r_x3": 384.11816, "r_y3": 258.54718, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 393.75256, "t": 266.67505000000006, "r": 451.45129000000003, "b": 273.77966000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 273.77966000000004, "r_x1": 451.45129000000003, "r_y1": 273.77966000000004, "r_x2": 451.45129000000003, "r_y2": 266.67505000000006, "r_x3": 393.75256, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 453.55083999999994, "t": 266.67505000000006, "r": 461.97485, "b": 273.77966000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55083999999994, "r_y0": 273.77966000000004, "r_x1": 461.97485, "r_y1": 273.77966000000004, "r_x2": 461.97485, "r_y2": 266.67505000000006, "r_x3": 453.55083999999994, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 151.79318, "t": 399.76016, "r": 233.89371000000003, "b": 406.86474999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79318, "r_y0": 406.86474999999996, "r_x1": 233.89371000000003, "r_y1": 406.86474999999996, "r_x2": 233.89371000000003, "r_y2": 399.76016, "r_x3": 151.79318, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 235.99332, "t": 399.76016, "r": 244.41734000000002, "b": 406.86474999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99332, "r_y0": 406.86474999999996, "r_x1": 244.41734000000002, "r_y1": 406.86474999999996, "r_x2": 244.41734000000002, "r_y2": 399.76016, "r_x3": 235.99332, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 246.52222, "t": 399.76016, "r": 268.83884, "b": 406.86474999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52222, "r_y0": 406.86474999999996, "r_x1": 268.83884, "r_y1": 406.86474999999996, "r_x2": 268.83884, "r_y2": 399.76016, "r_x3": 246.52222, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 154.3298, "t": 213.57457999999997, "r": 159.79837, "b": 220.67920000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3298, "r_y0": 220.67920000000004, "r_x1": 159.79837, "r_y1": 220.67920000000004, "r_x2": 159.79837, "r_y2": 213.57457999999997, "r_x3": 154.3298, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 321.07053, "t": 213.57457999999997, "r": 326.53909, "b": 220.67920000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07053, "r_y0": 220.67920000000004, "r_x1": 326.53909, "r_y1": 220.67920000000004, "r_x2": 326.53909, "r_y2": 213.57457999999997, "r_x3": 321.07053, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 153.0947, "t": 280.30411, "r": 175.83888, "b": 286.69824, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 286.69824, "r_x1": 175.83888, "r_y1": 286.69824, "r_x2": 175.83888, "r_y2": 280.30411, "r_x3": 153.0947, "r_y3": 280.30411, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 160.67039, "t": 287.12088, "r": 172.79608, "b": 293.51501, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 293.51501, "r_x1": 172.79608, "r_y1": 293.51501, "r_x2": 172.79608, "r_y2": 287.12088, "r_x3": 160.67039, "r_y3": 287.12088, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 168.24603, "t": 293.93765, "r": 177.91019, "b": 300.33179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 300.33179, "r_x1": 177.91019, "r_y1": 300.33179, "r_x2": 177.91019, "r_y2": 293.93765, "r_x3": 168.24603, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 263.35785, "t": 293.93765, "r": 278.89804, "b": 300.33179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.35785, "r_y0": 300.33179, "r_x1": 278.89804, "r_y1": 300.33179, "r_x2": 278.89804, "r_y2": 293.93765, "r_x3": 263.35785, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 280.79175, "t": 293.93765, "r": 290.4559, "b": 300.33179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79175, "r_y0": 300.33179, "r_x1": 290.4559, "r_y1": 300.33179, "r_x2": 290.4559, "r_y2": 293.93765, "r_x3": 280.79175, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 335.92926, "t": 293.93765, "r": 351.46945, "b": 300.33179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.92926, "r_y0": 300.33179, "r_x1": 351.46945, "r_y1": 300.33179, "r_x2": 351.46945, "r_y2": 293.93765, "r_x3": 335.92926, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 160.67039, "t": 300.75442999999996, "r": 174.68979, "b": 307.14856, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 307.14856, "r_x1": 174.68979, "r_y1": 307.14856, "r_x2": 174.68979, "r_y2": 300.75442999999996, "r_x3": 160.67039, "r_y3": 300.75442999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 160.67039, "t": 307.57122999999996, "r": 172.79608, "b": 313.96536, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 313.96536, "r_x1": 172.79608, "r_y1": 313.96536, "r_x2": 172.79608, "r_y2": 307.57122999999996, "r_x3": 160.67039, "r_y3": 307.57122999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 168.24603, "t": 314.388, "r": 181.89255, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 320.78214, "r_x1": 181.89255, "r_y1": 320.78214, "r_x2": 181.89255, "r_y2": 314.388, "r_x3": 168.24603, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 201.22015, "t": 314.388, "r": 214.86666999999997, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 320.78214, "r_x1": 214.86666999999997, "r_y1": 320.78214, "r_x2": 214.86666999999997, "r_y2": 314.388, "r_x3": 201.22015, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 234.19427000000002, "t": 314.388, "r": 247.84079000000003, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 320.78214, "r_x1": 247.84079000000003, "r_y1": 320.78214, "r_x2": 247.84079000000003, "r_y2": 314.388, "r_x3": 234.19427000000002, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 160.67039, "t": 321.20477, "r": 174.68979, "b": 327.59890999999993, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 327.59890999999993, "r_x1": 174.68979, "r_y1": 327.59890999999993, "r_x2": 174.68979, "r_y2": 321.20477, "r_x3": 160.67039, "r_y3": 321.20477, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 160.67039, "t": 328.02158, "r": 172.79608, "b": 334.41571000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 334.41571000000005, "r_x1": 172.79608, "r_y1": 334.41571000000005, "r_x2": 172.79608, "r_y2": 328.02158, "r_x3": 160.67039, "r_y3": 328.02158, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 168.24603, "t": 334.83835, "r": 373.09091, "b": 341.23248, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 341.23248, "r_x1": 373.09091, "r_y1": 341.23248, "r_x2": 373.09091, "r_y2": 334.83835, "r_x3": 168.24603, "r_y3": 334.83835, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 160.67039, "t": 341.65512, "r": 174.68979, "b": 348.04926, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 348.04926, "r_x1": 174.68979, "r_y1": 348.04926, "r_x2": 174.68979, "r_y2": 341.65512, "r_x3": 160.67039, "r_y3": 341.65512, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 160.67039, "t": 348.47159, "r": 172.79608, "b": 354.86572, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 354.86572, "r_x1": 172.79608, "r_y1": 354.86572, "r_x2": 172.79608, "r_y2": 348.47159, "r_x3": 160.67039, "r_y3": 348.47159, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 168.24603, "t": 355.28836000000007, "r": 181.89255, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 361.68249999999995, "r_x1": 181.89255, "r_y1": 361.68249999999995, "r_x2": 181.89255, "r_y2": 355.28836000000007, "r_x3": 168.24603, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 201.22015, "t": 355.28836000000007, "r": 214.86666999999997, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 361.68249999999995, "r_x1": 214.86666999999997, "r_y1": 361.68249999999995, "r_x2": 214.86666999999997, "r_y2": 355.28836000000007, "r_x3": 201.22015, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 234.19427000000002, "t": 355.28836000000007, "r": 247.84079000000003, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 361.68249999999995, "r_x1": 247.84079000000003, "r_y1": 361.68249999999995, "r_x2": 247.84079000000003, "r_y2": 355.28836000000007, "r_x3": 234.19427000000002, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 267.1684, "t": 355.28836000000007, "r": 280.81488, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 361.68249999999995, "r_x1": 280.81488, "r_y1": 361.68249999999995, "r_x2": 280.81488, "r_y2": 355.28836000000007, "r_x3": 267.1684, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 160.67039, "t": 362.10516000000007, "r": 174.68979, "b": 368.49929999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 368.49929999999995, "r_x1": 174.68979, "r_y1": 368.49929999999995, "r_x2": 174.68979, "r_y2": 362.10516000000007, "r_x3": 160.67039, "r_y3": 362.10516000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 160.67039, "t": 368.92194, "r": 172.79608, "b": 375.31607, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 375.31607, "r_x1": 172.79608, "r_y1": 375.31607, "r_x2": 172.79608, "r_y2": 368.92194, "r_x3": 160.67039, "r_y3": 368.92194, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 168.24603, "t": 375.73871, "r": 181.89255, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 382.13284, "r_x1": 181.89255, "r_y1": 382.13284, "r_x2": 181.89255, "r_y2": 375.73871, "r_x3": 168.24603, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 201.22015, "t": 375.73871, "r": 214.86666999999997, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 382.13284, "r_x1": 214.86666999999997, "r_y1": 382.13284, "r_x2": 214.86666999999997, "r_y2": 375.73871, "r_x3": 201.22015, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 234.19427000000002, "t": 375.73871, "r": 247.84079000000003, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 382.13284, "r_x1": 247.84079000000003, "r_y1": 382.13284, "r_x2": 247.84079000000003, "r_y2": 375.73871, "r_x3": 234.19427000000002, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 267.1684, "t": 375.73871, "r": 280.81488, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 382.13284, "r_x1": 280.81488, "r_y1": 382.13284, "r_x2": 280.81488, "r_y2": 375.73871, "r_x3": 267.1684, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 160.67039, "t": 382.55551, "r": 174.68979, "b": 388.94965, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 388.94965, "r_x1": 174.68979, "r_y1": 388.94965, "r_x2": 174.68979, "r_y2": 382.55551, "r_x3": 160.67039, "r_y3": 382.55551, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 153.0947, "t": 389.37228, "r": 177.73259, "b": 395.76642, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 395.76642, "r_x1": 177.73259, "r_y1": 395.76642, "r_x2": 177.73259, "r_y2": 389.37228, "r_x3": 153.0947, "r_y3": 389.37228, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.78624, "t": 314.388, "r": 199.32646, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 320.78214, "r_x1": 199.32646, "r_y1": 320.78214, "r_x2": 199.32646, "r_y2": 314.388, "r_x3": 183.78624, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 216.76038, "t": 314.388, "r": 232.30058, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 320.78214, "r_x1": 232.30058, "r_y1": 320.78214, "r_x2": 232.30058, "r_y2": 314.388, "r_x3": 216.76038, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 249.73447999999996, "t": 314.388, "r": 265.27469, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 320.78214, "r_x1": 265.27469, "r_y1": 320.78214, "r_x2": 265.27469, "r_y2": 314.388, "r_x3": 249.73447999999996, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 183.78624, "t": 355.28836000000007, "r": 199.32646, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 361.68249999999995, "r_x1": 199.32646, "r_y1": 361.68249999999995, "r_x2": 199.32646, "r_y2": 355.28836000000007, "r_x3": 183.78624, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 216.76038, "t": 355.28836000000007, "r": 232.30058, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 361.68249999999995, "r_x1": 232.30058, "r_y1": 361.68249999999995, "r_x2": 232.30058, "r_y2": 355.28836000000007, "r_x3": 216.76038, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 249.73447999999996, "t": 355.28836000000007, "r": 265.27469, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 361.68249999999995, "r_x1": 265.27469, "r_y1": 361.68249999999995, "r_x2": 265.27469, "r_y2": 355.28836000000007, "r_x3": 249.73447999999996, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 282.70862, "t": 355.28836000000007, "r": 298.24881, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 361.68249999999995, "r_x1": 298.24881, "r_y1": 361.68249999999995, "r_x2": 298.24881, "r_y2": 355.28836000000007, "r_x3": 282.70862, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.78624, "t": 375.73871, "r": 199.32646, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 382.13284, "r_x1": 199.32646, "r_y1": 382.13284, "r_x2": 199.32646, "r_y2": 375.73871, "r_x3": 183.78624, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 216.76038, "t": 375.73871, "r": 232.30058, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 382.13284, "r_x1": 232.30058, "r_y1": 382.13284, "r_x2": 232.30058, "r_y2": 375.73871, "r_x3": 216.76038, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 249.73447999999996, "t": 375.73871, "r": 265.27469, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 382.13284, "r_x1": 265.27469, "r_y1": 382.13284, "r_x2": 265.27469, "r_y2": 375.73871, "r_x3": 249.73447999999996, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 282.70862, "t": 375.73871, "r": 298.24881, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 382.13284, "r_x1": 298.24881, "r_y1": 382.13284, "r_x2": 298.24881, "r_y2": 375.73871, "r_x3": 282.70862, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 395.06137, "t": 411.33353, "r": 401.62366, "b": 419.85904, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06137, "r_y0": 419.85904, "r_x1": 401.62366, "r_y1": 419.85904, "r_x2": 401.62366, "r_y2": 411.33353, "r_x3": 395.06137, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 407.42249, "t": 411.33353, "r": 412.47598, "b": 419.85904, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42249, "r_y0": 419.85904, "r_x1": 412.47598, "r_y1": 419.85904, "r_x2": 412.47598, "r_y2": 411.33353, "r_x3": 407.42249, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 418.69287, "t": 411.33353, "r": 425.25516, "b": 419.85904, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69287, "r_y0": 419.85904, "r_x1": 425.25516, "r_y1": 419.85904, "r_x2": 425.25516, "r_y2": 411.33353, "r_x3": 418.69287, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 430.5086099999999, "t": 411.33353, "r": 436.5709800000001, "b": 419.85904, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5086099999999, "r_y0": 419.85904, "r_x1": 436.5709800000001, "r_y1": 419.85904, "r_x2": 436.5709800000001, "r_y2": 411.33353, "r_x3": 430.5086099999999, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 152.36208, "t": 409.77362, "r": 175.10626, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36208, "r_y0": 416.16776, "r_x1": 175.10626, "r_y1": 416.16776, "r_x2": 175.10626, "r_y2": 409.77362, "r_x3": 152.36208, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 178.89366, "t": 409.77362, "r": 191.01935, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89366, "r_y0": 416.16776, "r_x1": 191.01935, "r_y1": 416.16776, "r_x2": 191.01935, "r_y2": 409.77362, "r_x3": 178.89366, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 194.80676, "t": 409.77362, "r": 208.82614, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.80676, "r_y0": 416.16776, "r_x1": 208.82614, "r_y1": 416.16776, "r_x2": 208.82614, "r_y2": 409.77362, "r_x3": 194.80676, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 212.61354, "t": 409.77362, "r": 226.26003999999998, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61354, "r_y0": 416.16776, "r_x1": 226.26003999999998, "r_y1": 416.16776, "r_x2": 226.26003999999998, "r_y2": 409.77362, "r_x3": 212.61354, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 249.37506000000002, "t": 409.77362, "r": 259.03918, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.37506000000002, "r_y0": 416.16776, "r_x1": 259.03918, "r_y1": 416.16776, "r_x2": 259.03918, "r_y2": 409.77362, "r_x3": 249.37506000000002, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 244.46358, "t": 418.10522, "r": 269.10144, "b": 424.49936, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46358, "r_y0": 424.49936, "r_x1": 269.10144, "r_y1": 424.49936, "r_x2": 269.10144, "r_y2": 418.10522, "r_x3": 244.46358, "r_y3": 418.10522, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 230.04745000000003, "t": 409.77362, "r": 245.58765000000002, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.04745000000003, "r_y0": 416.16776, "r_x1": 245.58765000000002, "r_y1": 416.16776, "r_x2": 245.58765000000002, "r_y2": 409.77362, "r_x3": 230.04745000000003, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 154.50595, "t": 258.60095, "r": 159.62473, "b": 265.70556999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50595, "r_y0": 265.70556999999997, "r_x1": 159.62473, "r_y1": 265.70556999999997, "r_x2": 159.62473, "r_y2": 258.60095, "r_x3": 154.50595, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 164.74348, "t": 258.60095, "r": 185.21857, "b": 265.70556999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74348, "r_y0": 265.70556999999997, "r_x1": 185.21857, "r_y1": 265.70556999999997, "r_x2": 185.21857, "r_y2": 258.60095, "r_x3": 164.74348, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 164.3548, "t": 266.49707, "r": 222.05352999999997, "b": 273.60168, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.3548, "r_y0": 273.60168, "r_x1": 222.05352999999997, "r_y1": 273.60168, "r_x2": 222.05352999999997, "r_y2": 266.49707, "r_x3": 164.3548, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 224.15326, "t": 266.49707, "r": 232.57729, "b": 273.60168, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15326, "r_y0": 273.60168, "r_x1": 232.57729, "r_y1": 273.60168, "r_x2": 232.57729, "r_y2": 266.49707, "r_x3": 224.15326, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 2, "page_no": 1, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.765, "t": 452.31378, "r": 480.59232000000003, "b": 520.88669, "coord_origin": "TOPLEFT" }, "confidence": 0.950499951839447, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 461.11075, "r_x1": 161.32928, "r_y1": 461.11075, "r_x2": 161.32928, "r_y2": 452.31378, "r_x3": 134.765, "r_y3": 452.31378, "coord_origin": "TOPLEFT" }, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.269, "r_y0": 461.11075, "r_x1": 226.28617999999997, "r_y1": 461.11075, "r_x2": 226.28617999999997, "r_y2": 452.31378, "r_x3": 164.269, "r_y3": 452.31378, "coord_origin": "TOPLEFT" }, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.992, "r_y0": 461.11075, "r_x1": 480.59232000000003, "r_y1": 461.11075, "r_x2": 480.59232000000003, "r_y2": 452.31378, "r_x3": 229.992, "r_y3": 452.31378, "coord_origin": "TOPLEFT" }, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 473.06573, "r_x1": 480.59180000000003, "r_y1": 473.06573, "r_x2": 480.59180000000003, "r_y2": 464.26877, "r_x3": 134.76501, "r_y3": 464.26877, "coord_origin": "TOPLEFT" }, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 485.02072, "r_x1": 480.58673, "r_y1": 485.02072, "r_x2": 480.58673, "r_y2": 476.22375, "r_x3": 134.76501, "r_y3": 476.22375, "coord_origin": "TOPLEFT" }, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 496.97672, "r_x1": 480.58658, "r_y1": 496.97672, "r_x2": 480.58658, "r_y2": 488.17975, "r_x3": 134.76501, "r_y3": 488.17975, "coord_origin": "TOPLEFT" }, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 508.9317, "r_x1": 480.58978, "r_y1": 508.9317, "r_x2": 480.58978, "r_y2": 500.13474, "r_x3": 134.76501, "r_y3": 500.13474, "coord_origin": "TOPLEFT" }, "text": "area of research, in which many novel machine learning algorithms are being", "orig": "area of research, in which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 520.88669, "r_x1": 313.24597, "r_y1": 520.88669, "r_x2": 313.24597, "r_y2": 512.0897199999999, "r_x3": 134.76501, "r_y3": 512.0897199999999, "coord_origin": "TOPLEFT" }, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "today, table detection in documents is a well understood problem, and the latest state-of-the-art (SOTA) object detection methods provide an accuracy comparable to human observers [7,8,10,14,23]. On the other hand, the problem of table structure recognition (TSR) is a lot more challenging and remains a very active area of research, in which many novel machine learning algorithms are being explored [3,4,5,9,11,12,13,14,17,18,21,22]." }, { "label": "text", "id": 0, "page_no": 1, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76501, "t": 524.55072, "r": 480.59482, "b": 664.8547, "coord_origin": "TOPLEFT" }, "confidence": 0.9845512509346008, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70901, "r_y0": 533.3476900000001, "r_x1": 480.58884000000006, "r_y1": 533.3476900000001, "r_x2": 480.58884000000006, "r_y2": 524.55072, "r_x3": 149.70901, "r_y3": 524.55072, "coord_origin": "TOPLEFT" }, "text": "Recently emerging SOTA methods for table structure recognition employ", "orig": "Recently emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 545.30368, "r_x1": 480.5917400000001, "r_y1": 545.30368, "r_x2": 480.5917400000001, "r_y2": 536.50671, "r_x3": 134.76501, "r_y3": 536.50671, "coord_origin": "TOPLEFT" }, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 557.25868, "r_x1": 480.58868, "r_y1": 557.25868, "r_x2": 480.58868, "r_y2": 548.46172, "r_x3": 134.76501, "r_y3": 548.46172, "coord_origin": "TOPLEFT" }, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 569.2136800000001, "r_x1": 480.58795, "r_y1": 569.2136800000001, "r_x2": 480.58795, "r_y2": 560.41672, "r_x3": 134.76501, "r_y3": 560.41672, "coord_origin": "TOPLEFT" }, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 581.16869, "r_x1": 480.58978, "r_y1": 581.16869, "r_x2": 480.58978, "r_y2": 572.37172, "r_x3": 134.76501, "r_y3": 572.37172, "coord_origin": "TOPLEFT" }, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 593.12369, "r_x1": 480.59479, "r_y1": 593.12369, "r_x2": 480.59479, "r_y2": 584.32672, "r_x3": 134.76501, "r_y3": 584.32672, "coord_origin": "TOPLEFT" }, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 605.0796799999999, "r_x1": 480.58678999999995, "r_y1": 605.0796799999999, "r_x2": 480.58678999999995, "r_y2": 596.28271, "r_x3": 134.76501, "r_y3": 596.28271, "coord_origin": "TOPLEFT" }, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 617.03468, "r_x1": 480.59476, "r_y1": 617.03468, "r_x2": 480.59476, "r_y2": 608.23772, "r_x3": 134.76501, "r_y3": 608.23772, "coord_origin": "TOPLEFT" }, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 628.98969, "r_x1": 480.5938100000001, "r_y1": 628.98969, "r_x2": 480.5938100000001, "r_y2": 620.19272, "r_x3": 134.76501, "r_y3": 620.19272, "coord_origin": "TOPLEFT" }, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 640.94469, "r_x1": 480.59482, "r_y1": 640.94469, "r_x2": 480.59482, "r_y2": 632.1477199999999, "r_x3": 134.76501, "r_y3": 632.1477199999999, "coord_origin": "TOPLEFT" }, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 652.89969, "r_x1": 480.58771, "r_y1": 652.89969, "r_x2": 480.58771, "r_y2": 644.10272, "r_x3": 134.76501, "r_y3": 644.10272, "coord_origin": "TOPLEFT" }, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 664.8547, "r_x1": 421.45377, "r_y1": 664.8547, "r_x2": 421.45377, "r_y2": 656.05772, "r_x3": 134.76501, "r_y3": 656.05772, "coord_origin": "TOPLEFT" }, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Recently emerging SOTA methods for table structure recognition employ transformer-based models, in which an image of the table is provided to the network in order to predict the structure of the table as a sequence of tokens. These image-to-sequence (Im2Seq) models are extremely powerful, since they allow for a purely data-driven solution. The tokens of the sequence typically belong to a markup language such as HTML, Latex or Markdown, which allow to describe table structure as rows, columns and spanning cells in various configurations. In Figure 1, we illustrate how HTML is used to represent the table-structure of a particular example table. Public table-structure data sets such as PubTabNet [22], and FinTabNet [21], which were created in a semi-automated way from paired PDF and HTML sources (e.g. PubMed Central), popularized primarily the use of HTML as ground-truth representation format for TSR." } ], "body": [ { "label": "caption", "id": 4, "page_no": 1, "cluster": { "id": 4, "label": "caption", "bbox": { "l": 134.765, "t": 126.33416999999997, "r": 480.59189, "b": 200.22058000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.8939083218574524, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 134.26049999999998, "r_x1": 162.64424, "r_y1": 134.26049999999998, "r_x2": 162.64424, "r_y2": 126.33416999999997, "r_x3": 134.765, "r_y3": 126.33416999999997, "coord_origin": "TOPLEFT" }, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.062, "r_y0": 134.46667000000002, "r_x1": 480.59106, "r_y1": 134.46667000000002, "r_x2": 480.59106, "r_y2": 126.39697000000001, "r_x3": 167.062, "r_y3": 126.39697000000001, "coord_origin": "TOPLEFT" }, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 145.42566, "r_x1": 480.59018, "r_y1": 145.42566, "r_x2": 480.59018, "r_y2": 137.35595999999998, "r_x3": 134.765, "r_y3": 137.35595999999998, "coord_origin": "TOPLEFT" }, "text": "table-example with complex row and column headers, including a 2D empty span,", "orig": "table-example with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 156.38464, "r_x1": 147.95433, "r_y1": 156.38464, "r_x2": 147.95433, "r_y2": 148.31493999999998, "r_x3": 134.765, "r_y3": 148.31493999999998, "coord_origin": "TOPLEFT" }, "text": "(B)", "orig": "(B)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.39224, "r_y0": 156.38464, "r_x1": 480.59096999999997, "r_y1": 156.38464, "r_x2": 480.59096999999997, "r_y2": 148.31493999999998, "r_x3": 152.39224, "r_y3": 148.31493999999998, "coord_origin": "TOPLEFT" }, "text": "minimal graphical representation of table structure using rectangular layout, (C)", "orig": "minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 167.34362999999996, "r_x1": 480.59189, "r_y1": 167.34362999999996, "r_x2": 480.59189, "r_y2": 159.27392999999995, "r_x3": 134.765, "r_y3": 159.27392999999995, "coord_origin": "TOPLEFT" }, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 178.30260999999996, "r_x1": 480.58914000000004, "r_y1": 178.30260999999996, "r_x2": 480.58914000000004, "r_y2": 170.23290999999995, "r_x3": 134.765, "r_y3": 170.23290999999995, "coord_origin": "TOPLEFT" }, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 189.26160000000004, "r_x1": 480.59020999999996, "r_y1": 189.26160000000004, "r_x2": 480.59020999999996, "r_y2": 181.19188999999994, "r_x3": 134.765, "r_y3": 181.19188999999994, "coord_origin": "TOPLEFT" }, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 200.22058000000004, "r_x1": 460.87109, "r_y1": 200.22058000000004, "r_x2": 460.87109, "r_y2": 192.15088000000003, "r_x3": 134.765, "r_y3": 192.15088000000003, "coord_origin": "TOPLEFT" }, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 1. Comparison between HTML and OTSL table structure representation: (A) table-example with complex row and column headers, including a 2D empty span, (B) minimal graphical representation of table structure using rectangular layout, (C) HTML representation, (D) OTSL representation. This example demonstrates many of the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case), its reduced sequence length (55 versus 30) and a enhanced internal structure (variable token sequence length per row in HTML versus a fixed length of rows in OTSL)." }, { "label": "picture", "id": 1, "page_no": 1, "cluster": { "id": 1, "label": "picture", "bbox": { "l": 148.45364379882812, "t": 208.37423706054688, "r": 464.3608093261719, "b": 425.8462219238281, "coord_origin": "TOPLEFT" }, "confidence": 0.9688959121704102, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41107, "r_y0": 289.50903, "r_x1": 402.97336, "r_y1": 289.50903, "r_x2": 402.97336, "r_y2": 280.98352, "r_x3": 396.41107, "r_y3": 280.98352, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.58682, "r_y0": 289.42343, "r_x1": 425.14911, "r_y1": 289.42343, "r_x2": 425.14911, "r_y2": 280.89792, "r_x3": 418.58682, "r_y3": 280.89792, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.74835, "r_y0": 311.76279, "r_x1": 402.31064, "r_y1": 311.76279, "r_x2": 402.31064, "r_y2": 303.23727, "r_x3": 395.74835, "r_y3": 303.23727, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54214, "r_y0": 311.89532, "r_x1": 414.10443, "r_y1": 311.89532, "r_x2": 414.10443, "r_y2": 303.36981, "r_x3": 407.54214, "r_y3": 303.36981, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56335, "r_y0": 322.9317, "r_x1": 414.12564, "r_y1": 322.9317, "r_x2": 414.12564, "r_y2": 314.40619, "r_x3": 407.56335, "r_y3": 314.40619, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51108, "r_y0": 300.61053000000004, "r_x1": 425.07336, "r_y1": 300.61053000000004, "r_x2": 425.07336, "r_y2": 292.08502000000004, "r_x3": 418.51108, "r_y3": 292.08502000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.59744, "r_y0": 300.61658, "r_x1": 436.1597300000001, "r_y1": 300.61658, "r_x2": 436.1597300000001, "r_y2": 292.09106, "r_x3": 429.59744, "r_y3": 292.09106, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.68759000000006, "r_y0": 300.53781000000004, "r_x1": 447.24987999999996, "r_y1": 300.53781000000004, "r_x2": 447.24987999999996, "r_y2": 292.01230000000004, "r_x3": 440.68759000000006, "r_y3": 292.01230000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6232, "r_y0": 311.82034, "r_x1": 425.18549, "r_y1": 311.82034, "r_x2": 425.18549, "r_y2": 303.29483, "r_x3": 418.6232, "r_y3": 303.29483, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7095299999999, "r_y0": 311.82562, "r_x1": 436.27182, "r_y1": 311.82562, "r_x2": 436.27182, "r_y2": 303.30011, "r_x3": 429.7095299999999, "r_y3": 303.30011, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7996800000001, "r_y0": 311.74762, "r_x1": 447.36197, "r_y1": 311.74762, "r_x2": 447.36197, "r_y2": 303.22211, "r_x3": 440.7996800000001, "r_y3": 303.22211, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62546, "r_y0": 323.09454, "r_x1": 425.18774, "r_y1": 323.09454, "r_x2": 425.18774, "r_y2": 314.56903, "r_x3": 418.62546, "r_y3": 314.56903, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71181999999993, "r_y0": 323.09985, "r_x1": 436.27411, "r_y1": 323.09985, "r_x2": 436.27411, "r_y2": 314.57434, "r_x3": 429.71181999999993, "r_y3": 314.57434, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.80194, "r_y0": 323.02182, "r_x1": 447.36423, "r_y1": 323.02182, "r_x2": 447.36423, "r_y2": 314.49631, "r_x3": 440.80194, "r_y3": 314.49631, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.39746, "r_y0": 333.81583, "r_x1": 413.95975, "r_y1": 333.81583, "r_x2": 413.95975, "r_y2": 325.29031, "r_x3": 407.39746, "r_y3": 325.29031, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.45959, "r_y0": 333.97867, "r_x1": 425.02188, "r_y1": 333.97867, "r_x2": 425.02188, "r_y2": 325.45316, "r_x3": 418.45959, "r_y3": 325.45316, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.54593, "r_y0": 333.98471, "r_x1": 436.10822, "r_y1": 333.98471, "r_x2": 436.10822, "r_y2": 325.4592, "r_x3": 429.54593, "r_y3": 325.4592, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.63608, "r_y0": 333.90594, "r_x1": 447.19836, "r_y1": 333.90594, "r_x2": 447.19836, "r_y2": 325.38043, "r_x3": 440.63608, "r_y3": 325.38043, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.89511000000005, "r_y0": 288.68268, "r_x1": 463.51273000000003, "r_y1": 288.68268, "r_x2": 463.51273000000003, "r_y2": 280.15717, "r_x3": 451.89511000000005, "r_y3": 280.15717, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1557, "r_y0": 300.12427, "r_x1": 463.77332, "r_y1": 300.12427, "r_x2": 463.77332, "r_y2": 291.59875000000005, "r_x3": 452.1557, "r_y3": 291.59875000000005, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.17688000000004, "r_y0": 311.36816, "r_x1": 463.79449000000005, "r_y1": 311.36816, "r_x2": 463.79449000000005, "r_y2": 302.84265, "r_x3": 452.17688000000004, "r_y3": 302.84265, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.09887999999995, "r_y0": 322.6499299999999, "r_x1": 463.71648999999996, "r_y1": 322.6499299999999, "r_x2": 463.71648999999996, "r_y2": 314.12441999999993, "r_x3": 452.09887999999995, "r_y3": 314.12441999999993, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.29733, "r_y0": 333.99457, "r_x1": 463.91495, "r_y1": 333.99457, "r_x2": 463.91495, "r_y2": 325.46906, "r_x3": 452.29733, "r_y3": 325.46906, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.09677, "r_y0": 323.02029000000005, "r_x1": 402.65906, "r_y1": 323.02029000000005, "r_x2": 402.65906, "r_y2": 314.49478, "r_x3": 396.09677, "r_y3": 314.49478, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.99829, "r_y0": 333.91428, "r_x1": 402.56058, "r_y1": 333.91428, "r_x2": 402.56058, "r_y2": 325.38876000000005, "r_x3": 395.99829, "r_y3": 325.38876000000005, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27475, "r_y0": 300.79608, "r_x1": 402.83704, "r_y1": 300.79608, "r_x2": 402.83704, "r_y2": 292.27057, "r_x3": 396.27475, "r_y3": 292.27057, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.54724, "r_y0": 289.49463, "r_x1": 413.60074, "r_y1": 289.49463, "r_x2": 413.60074, "r_y2": 280.96912, "r_x3": 408.54724, "r_y3": 280.96912, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.58966, "r_y0": 289.02277, "r_x1": 435.6431600000001, "r_y1": 289.02277, "r_x2": 435.6431600000001, "r_y2": 280.49725, "r_x3": 430.58966, "r_y3": 280.49725, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08069, "r_y0": 288.90613, "r_x1": 446.13419, "r_y1": 288.90613, "r_x2": 446.13419, "r_y2": 280.38062, "r_x3": 441.08069, "r_y3": 280.38062, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97388, "r_y0": 300.65976, "r_x1": 414.03625, "r_y1": 300.65976, "r_x2": 414.03625, "r_y2": 292.13425, "r_x3": 407.97388, "r_y3": 292.13425, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.25640999999996, "r_y0": 419.7062700000001, "r_x1": 452.87402, "r_y1": 419.7062700000001, "r_x2": 452.87402, "r_y2": 411.1807600000001, "r_x3": 441.25640999999996, "r_y3": 411.1807600000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 406.89935, "r_x1": 432.48929, "r_y1": 406.89935, "r_x2": 432.48929, "r_y2": 399.7947700000001, "r_x3": 393.75256, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.5896000000001, "r_y0": 406.89935, "r_x1": 438.80083999999994, "r_y1": 406.89935, "r_x2": 438.80083999999994, "r_y2": 399.7947700000001, "r_x3": 434.5896000000001, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.90573, "r_y0": 406.89935, "r_x1": 463.22235, "r_y1": 406.89935, "r_x2": 463.22235, "r_y2": 399.7947700000001, "r_x3": 440.90573, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.11816, "r_y0": 265.65179, "r_x1": 413.99307, "r_y1": 265.65179, "r_x2": 413.99307, "r_y2": 258.54718, "r_x3": 384.11816, "r_y3": 258.54718, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 273.77966000000004, "r_x1": 451.45129000000003, "r_y1": 273.77966000000004, "r_x2": 451.45129000000003, "r_y2": 266.67505000000006, "r_x3": 393.75256, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55083999999994, "r_y0": 273.77966000000004, "r_x1": 461.97485, "r_y1": 273.77966000000004, "r_x2": 461.97485, "r_y2": 266.67505000000006, "r_x3": 453.55083999999994, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79318, "r_y0": 406.86474999999996, "r_x1": 233.89371000000003, "r_y1": 406.86474999999996, "r_x2": 233.89371000000003, "r_y2": 399.76016, "r_x3": 151.79318, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99332, "r_y0": 406.86474999999996, "r_x1": 244.41734000000002, "r_y1": 406.86474999999996, "r_x2": 244.41734000000002, "r_y2": 399.76016, "r_x3": 235.99332, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52222, "r_y0": 406.86474999999996, "r_x1": 268.83884, "r_y1": 406.86474999999996, "r_x2": 268.83884, "r_y2": 399.76016, "r_x3": 246.52222, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3298, "r_y0": 220.67920000000004, "r_x1": 159.79837, "r_y1": 220.67920000000004, "r_x2": 159.79837, "r_y2": 213.57457999999997, "r_x3": 154.3298, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07053, "r_y0": 220.67920000000004, "r_x1": 326.53909, "r_y1": 220.67920000000004, "r_x2": 326.53909, "r_y2": 213.57457999999997, "r_x3": 321.07053, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 286.69824, "r_x1": 175.83888, "r_y1": 286.69824, "r_x2": 175.83888, "r_y2": 280.30411, "r_x3": 153.0947, "r_y3": 280.30411, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 293.51501, "r_x1": 172.79608, "r_y1": 293.51501, "r_x2": 172.79608, "r_y2": 287.12088, "r_x3": 160.67039, "r_y3": 287.12088, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 300.33179, "r_x1": 177.91019, "r_y1": 300.33179, "r_x2": 177.91019, "r_y2": 293.93765, "r_x3": 168.24603, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.35785, "r_y0": 300.33179, "r_x1": 278.89804, "r_y1": 300.33179, "r_x2": 278.89804, "r_y2": 293.93765, "r_x3": 263.35785, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79175, "r_y0": 300.33179, "r_x1": 290.4559, "r_y1": 300.33179, "r_x2": 290.4559, "r_y2": 293.93765, "r_x3": 280.79175, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.92926, "r_y0": 300.33179, "r_x1": 351.46945, "r_y1": 300.33179, "r_x2": 351.46945, "r_y2": 293.93765, "r_x3": 335.92926, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 307.14856, "r_x1": 174.68979, "r_y1": 307.14856, "r_x2": 174.68979, "r_y2": 300.75442999999996, "r_x3": 160.67039, "r_y3": 300.75442999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 313.96536, "r_x1": 172.79608, "r_y1": 313.96536, "r_x2": 172.79608, "r_y2": 307.57122999999996, "r_x3": 160.67039, "r_y3": 307.57122999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 320.78214, "r_x1": 181.89255, "r_y1": 320.78214, "r_x2": 181.89255, "r_y2": 314.388, "r_x3": 168.24603, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 320.78214, "r_x1": 214.86666999999997, "r_y1": 320.78214, "r_x2": 214.86666999999997, "r_y2": 314.388, "r_x3": 201.22015, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 320.78214, "r_x1": 247.84079000000003, "r_y1": 320.78214, "r_x2": 247.84079000000003, "r_y2": 314.388, "r_x3": 234.19427000000002, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 327.59890999999993, "r_x1": 174.68979, "r_y1": 327.59890999999993, "r_x2": 174.68979, "r_y2": 321.20477, "r_x3": 160.67039, "r_y3": 321.20477, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 334.41571000000005, "r_x1": 172.79608, "r_y1": 334.41571000000005, "r_x2": 172.79608, "r_y2": 328.02158, "r_x3": 160.67039, "r_y3": 328.02158, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 341.23248, "r_x1": 373.09091, "r_y1": 341.23248, "r_x2": 373.09091, "r_y2": 334.83835, "r_x3": 168.24603, "r_y3": 334.83835, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 348.04926, "r_x1": 174.68979, "r_y1": 348.04926, "r_x2": 174.68979, "r_y2": 341.65512, "r_x3": 160.67039, "r_y3": 341.65512, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 354.86572, "r_x1": 172.79608, "r_y1": 354.86572, "r_x2": 172.79608, "r_y2": 348.47159, "r_x3": 160.67039, "r_y3": 348.47159, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 361.68249999999995, "r_x1": 181.89255, "r_y1": 361.68249999999995, "r_x2": 181.89255, "r_y2": 355.28836000000007, "r_x3": 168.24603, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 361.68249999999995, "r_x1": 214.86666999999997, "r_y1": 361.68249999999995, "r_x2": 214.86666999999997, "r_y2": 355.28836000000007, "r_x3": 201.22015, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 361.68249999999995, "r_x1": 247.84079000000003, "r_y1": 361.68249999999995, "r_x2": 247.84079000000003, "r_y2": 355.28836000000007, "r_x3": 234.19427000000002, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 361.68249999999995, "r_x1": 280.81488, "r_y1": 361.68249999999995, "r_x2": 280.81488, "r_y2": 355.28836000000007, "r_x3": 267.1684, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 368.49929999999995, "r_x1": 174.68979, "r_y1": 368.49929999999995, "r_x2": 174.68979, "r_y2": 362.10516000000007, "r_x3": 160.67039, "r_y3": 362.10516000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 375.31607, "r_x1": 172.79608, "r_y1": 375.31607, "r_x2": 172.79608, "r_y2": 368.92194, "r_x3": 160.67039, "r_y3": 368.92194, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 382.13284, "r_x1": 181.89255, "r_y1": 382.13284, "r_x2": 181.89255, "r_y2": 375.73871, "r_x3": 168.24603, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 382.13284, "r_x1": 214.86666999999997, "r_y1": 382.13284, "r_x2": 214.86666999999997, "r_y2": 375.73871, "r_x3": 201.22015, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 382.13284, "r_x1": 247.84079000000003, "r_y1": 382.13284, "r_x2": 247.84079000000003, "r_y2": 375.73871, "r_x3": 234.19427000000002, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 382.13284, "r_x1": 280.81488, "r_y1": 382.13284, "r_x2": 280.81488, "r_y2": 375.73871, "r_x3": 267.1684, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 388.94965, "r_x1": 174.68979, "r_y1": 388.94965, "r_x2": 174.68979, "r_y2": 382.55551, "r_x3": 160.67039, "r_y3": 382.55551, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 395.76642, "r_x1": 177.73259, "r_y1": 395.76642, "r_x2": 177.73259, "r_y2": 389.37228, "r_x3": 153.0947, "r_y3": 389.37228, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 320.78214, "r_x1": 199.32646, "r_y1": 320.78214, "r_x2": 199.32646, "r_y2": 314.388, "r_x3": 183.78624, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 320.78214, "r_x1": 232.30058, "r_y1": 320.78214, "r_x2": 232.30058, "r_y2": 314.388, "r_x3": 216.76038, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 320.78214, "r_x1": 265.27469, "r_y1": 320.78214, "r_x2": 265.27469, "r_y2": 314.388, "r_x3": 249.73447999999996, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 361.68249999999995, "r_x1": 199.32646, "r_y1": 361.68249999999995, "r_x2": 199.32646, "r_y2": 355.28836000000007, "r_x3": 183.78624, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 361.68249999999995, "r_x1": 232.30058, "r_y1": 361.68249999999995, "r_x2": 232.30058, "r_y2": 355.28836000000007, "r_x3": 216.76038, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 361.68249999999995, "r_x1": 265.27469, "r_y1": 361.68249999999995, "r_x2": 265.27469, "r_y2": 355.28836000000007, "r_x3": 249.73447999999996, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 361.68249999999995, "r_x1": 298.24881, "r_y1": 361.68249999999995, "r_x2": 298.24881, "r_y2": 355.28836000000007, "r_x3": 282.70862, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 382.13284, "r_x1": 199.32646, "r_y1": 382.13284, "r_x2": 199.32646, "r_y2": 375.73871, "r_x3": 183.78624, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 382.13284, "r_x1": 232.30058, "r_y1": 382.13284, "r_x2": 232.30058, "r_y2": 375.73871, "r_x3": 216.76038, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 382.13284, "r_x1": 265.27469, "r_y1": 382.13284, "r_x2": 265.27469, "r_y2": 375.73871, "r_x3": 249.73447999999996, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 382.13284, "r_x1": 298.24881, "r_y1": 382.13284, "r_x2": 298.24881, "r_y2": 375.73871, "r_x3": 282.70862, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06137, "r_y0": 419.85904, "r_x1": 401.62366, "r_y1": 419.85904, "r_x2": 401.62366, "r_y2": 411.33353, "r_x3": 395.06137, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42249, "r_y0": 419.85904, "r_x1": 412.47598, "r_y1": 419.85904, "r_x2": 412.47598, "r_y2": 411.33353, "r_x3": 407.42249, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69287, "r_y0": 419.85904, "r_x1": 425.25516, "r_y1": 419.85904, "r_x2": 425.25516, "r_y2": 411.33353, "r_x3": 418.69287, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5086099999999, "r_y0": 419.85904, "r_x1": 436.5709800000001, "r_y1": 419.85904, "r_x2": 436.5709800000001, "r_y2": 411.33353, "r_x3": 430.5086099999999, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36208, "r_y0": 416.16776, "r_x1": 175.10626, "r_y1": 416.16776, "r_x2": 175.10626, "r_y2": 409.77362, "r_x3": 152.36208, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89366, "r_y0": 416.16776, "r_x1": 191.01935, "r_y1": 416.16776, "r_x2": 191.01935, "r_y2": 409.77362, "r_x3": 178.89366, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.80676, "r_y0": 416.16776, "r_x1": 208.82614, "r_y1": 416.16776, "r_x2": 208.82614, "r_y2": 409.77362, "r_x3": 194.80676, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61354, "r_y0": 416.16776, "r_x1": 226.26003999999998, "r_y1": 416.16776, "r_x2": 226.26003999999998, "r_y2": 409.77362, "r_x3": 212.61354, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.37506000000002, "r_y0": 416.16776, "r_x1": 259.03918, "r_y1": 416.16776, "r_x2": 259.03918, "r_y2": 409.77362, "r_x3": 249.37506000000002, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46358, "r_y0": 424.49936, "r_x1": 269.10144, "r_y1": 424.49936, "r_x2": 269.10144, "r_y2": 418.10522, "r_x3": 244.46358, "r_y3": 418.10522, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.04745000000003, "r_y0": 416.16776, "r_x1": 245.58765000000002, "r_y1": 416.16776, "r_x2": 245.58765000000002, "r_y2": 409.77362, "r_x3": 230.04745000000003, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50595, "r_y0": 265.70556999999997, "r_x1": 159.62473, "r_y1": 265.70556999999997, "r_x2": 159.62473, "r_y2": 258.60095, "r_x3": 154.50595, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74348, "r_y0": 265.70556999999997, "r_x1": 185.21857, "r_y1": 265.70556999999997, "r_x2": 185.21857, "r_y2": 258.60095, "r_x3": 164.74348, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.3548, "r_y0": 273.60168, "r_x1": 222.05352999999997, "r_y1": 273.60168, "r_x2": 222.05352999999997, "r_y2": 266.49707, "r_x3": 164.3548, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15326, "r_y0": 273.60168, "r_x1": 232.57729, "r_y1": 273.60168, "r_x2": 232.57729, "r_y2": 266.49707, "r_x3": 224.15326, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 396.41107, "t": 280.98352, "r": 402.97336, "b": 289.50903, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41107, "r_y0": 289.50903, "r_x1": 402.97336, "r_y1": 289.50903, "r_x2": 402.97336, "r_y2": 280.98352, "r_x3": 396.41107, "r_y3": 280.98352, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 418.58682, "t": 280.89792, "r": 425.14911, "b": 289.42343, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.58682, "r_y0": 289.42343, "r_x1": 425.14911, "r_y1": 289.42343, "r_x2": 425.14911, "r_y2": 280.89792, "r_x3": 418.58682, "r_y3": 280.89792, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 395.74835, "t": 303.23727, "r": 402.31064, "b": 311.76279, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.74835, "r_y0": 311.76279, "r_x1": 402.31064, "r_y1": 311.76279, "r_x2": 402.31064, "r_y2": 303.23727, "r_x3": 395.74835, "r_y3": 303.23727, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 407.54214, "t": 303.36981, "r": 414.10443, "b": 311.89532, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54214, "r_y0": 311.89532, "r_x1": 414.10443, "r_y1": 311.89532, "r_x2": 414.10443, "r_y2": 303.36981, "r_x3": 407.54214, "r_y3": 303.36981, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 407.56335, "t": 314.40619, "r": 414.12564, "b": 322.9317, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56335, "r_y0": 322.9317, "r_x1": 414.12564, "r_y1": 322.9317, "r_x2": 414.12564, "r_y2": 314.40619, "r_x3": 407.56335, "r_y3": 314.40619, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 418.51108, "t": 292.08502000000004, "r": 425.07336, "b": 300.61053000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51108, "r_y0": 300.61053000000004, "r_x1": 425.07336, "r_y1": 300.61053000000004, "r_x2": 425.07336, "r_y2": 292.08502000000004, "r_x3": 418.51108, "r_y3": 292.08502000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 429.59744, "t": 292.09106, "r": 436.1597300000001, "b": 300.61658, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.59744, "r_y0": 300.61658, "r_x1": 436.1597300000001, "r_y1": 300.61658, "r_x2": 436.1597300000001, "r_y2": 292.09106, "r_x3": 429.59744, "r_y3": 292.09106, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 440.68759000000006, "t": 292.01230000000004, "r": 447.24987999999996, "b": 300.53781000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.68759000000006, "r_y0": 300.53781000000004, "r_x1": 447.24987999999996, "r_y1": 300.53781000000004, "r_x2": 447.24987999999996, "r_y2": 292.01230000000004, "r_x3": 440.68759000000006, "r_y3": 292.01230000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 418.6232, "t": 303.29483, "r": 425.18549, "b": 311.82034, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6232, "r_y0": 311.82034, "r_x1": 425.18549, "r_y1": 311.82034, "r_x2": 425.18549, "r_y2": 303.29483, "r_x3": 418.6232, "r_y3": 303.29483, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 429.7095299999999, "t": 303.30011, "r": 436.27182, "b": 311.82562, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7095299999999, "r_y0": 311.82562, "r_x1": 436.27182, "r_y1": 311.82562, "r_x2": 436.27182, "r_y2": 303.30011, "r_x3": 429.7095299999999, "r_y3": 303.30011, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 440.7996800000001, "t": 303.22211, "r": 447.36197, "b": 311.74762, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7996800000001, "r_y0": 311.74762, "r_x1": 447.36197, "r_y1": 311.74762, "r_x2": 447.36197, "r_y2": 303.22211, "r_x3": 440.7996800000001, "r_y3": 303.22211, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 418.62546, "t": 314.56903, "r": 425.18774, "b": 323.09454, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62546, "r_y0": 323.09454, "r_x1": 425.18774, "r_y1": 323.09454, "r_x2": 425.18774, "r_y2": 314.56903, "r_x3": 418.62546, "r_y3": 314.56903, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 429.71181999999993, "t": 314.57434, "r": 436.27411, "b": 323.09985, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71181999999993, "r_y0": 323.09985, "r_x1": 436.27411, "r_y1": 323.09985, "r_x2": 436.27411, "r_y2": 314.57434, "r_x3": 429.71181999999993, "r_y3": 314.57434, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 440.80194, "t": 314.49631, "r": 447.36423, "b": 323.02182, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.80194, "r_y0": 323.02182, "r_x1": 447.36423, "r_y1": 323.02182, "r_x2": 447.36423, "r_y2": 314.49631, "r_x3": 440.80194, "r_y3": 314.49631, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 407.39746, "t": 325.29031, "r": 413.95975, "b": 333.81583, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.39746, "r_y0": 333.81583, "r_x1": 413.95975, "r_y1": 333.81583, "r_x2": 413.95975, "r_y2": 325.29031, "r_x3": 407.39746, "r_y3": 325.29031, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 418.45959, "t": 325.45316, "r": 425.02188, "b": 333.97867, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.45959, "r_y0": 333.97867, "r_x1": 425.02188, "r_y1": 333.97867, "r_x2": 425.02188, "r_y2": 325.45316, "r_x3": 418.45959, "r_y3": 325.45316, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 429.54593, "t": 325.4592, "r": 436.10822, "b": 333.98471, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.54593, "r_y0": 333.98471, "r_x1": 436.10822, "r_y1": 333.98471, "r_x2": 436.10822, "r_y2": 325.4592, "r_x3": 429.54593, "r_y3": 325.4592, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 440.63608, "t": 325.38043, "r": 447.19836, "b": 333.90594, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.63608, "r_y0": 333.90594, "r_x1": 447.19836, "r_y1": 333.90594, "r_x2": 447.19836, "r_y2": 325.38043, "r_x3": 440.63608, "r_y3": 325.38043, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 451.89511000000005, "t": 280.15717, "r": 463.51273000000003, "b": 288.68268, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.89511000000005, "r_y0": 288.68268, "r_x1": 463.51273000000003, "r_y1": 288.68268, "r_x2": 463.51273000000003, "r_y2": 280.15717, "r_x3": 451.89511000000005, "r_y3": 280.15717, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 452.1557, "t": 291.59875000000005, "r": 463.77332, "b": 300.12427, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1557, "r_y0": 300.12427, "r_x1": 463.77332, "r_y1": 300.12427, "r_x2": 463.77332, "r_y2": 291.59875000000005, "r_x3": 452.1557, "r_y3": 291.59875000000005, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 452.17688000000004, "t": 302.84265, "r": 463.79449000000005, "b": 311.36816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.17688000000004, "r_y0": 311.36816, "r_x1": 463.79449000000005, "r_y1": 311.36816, "r_x2": 463.79449000000005, "r_y2": 302.84265, "r_x3": 452.17688000000004, "r_y3": 302.84265, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 452.09887999999995, "t": 314.12441999999993, "r": 463.71648999999996, "b": 322.6499299999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.09887999999995, "r_y0": 322.6499299999999, "r_x1": 463.71648999999996, "r_y1": 322.6499299999999, "r_x2": 463.71648999999996, "r_y2": 314.12441999999993, "r_x3": 452.09887999999995, "r_y3": 314.12441999999993, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 452.29733, "t": 325.46906, "r": 463.91495, "b": 333.99457, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.29733, "r_y0": 333.99457, "r_x1": 463.91495, "r_y1": 333.99457, "r_x2": 463.91495, "r_y2": 325.46906, "r_x3": 452.29733, "r_y3": 325.46906, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 396.09677, "t": 314.49478, "r": 402.65906, "b": 323.02029000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.09677, "r_y0": 323.02029000000005, "r_x1": 402.65906, "r_y1": 323.02029000000005, "r_x2": 402.65906, "r_y2": 314.49478, "r_x3": 396.09677, "r_y3": 314.49478, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 395.99829, "t": 325.38876000000005, "r": 402.56058, "b": 333.91428, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.99829, "r_y0": 333.91428, "r_x1": 402.56058, "r_y1": 333.91428, "r_x2": 402.56058, "r_y2": 325.38876000000005, "r_x3": 395.99829, "r_y3": 325.38876000000005, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.27475, "t": 292.27057, "r": 402.83704, "b": 300.79608, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27475, "r_y0": 300.79608, "r_x1": 402.83704, "r_y1": 300.79608, "r_x2": 402.83704, "r_y2": 292.27057, "r_x3": 396.27475, "r_y3": 292.27057, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 408.54724, "t": 280.96912, "r": 413.60074, "b": 289.49463, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.54724, "r_y0": 289.49463, "r_x1": 413.60074, "r_y1": 289.49463, "r_x2": 413.60074, "r_y2": 280.96912, "r_x3": 408.54724, "r_y3": 280.96912, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 430.58966, "t": 280.49725, "r": 435.6431600000001, "b": 289.02277, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.58966, "r_y0": 289.02277, "r_x1": 435.6431600000001, "r_y1": 289.02277, "r_x2": 435.6431600000001, "r_y2": 280.49725, "r_x3": 430.58966, "r_y3": 280.49725, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 441.08069, "t": 280.38062, "r": 446.13419, "b": 288.90613, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08069, "r_y0": 288.90613, "r_x1": 446.13419, "r_y1": 288.90613, "r_x2": 446.13419, "r_y2": 280.38062, "r_x3": 441.08069, "r_y3": 280.38062, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 407.97388, "t": 292.13425, "r": 414.03625, "b": 300.65976, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97388, "r_y0": 300.65976, "r_x1": 414.03625, "r_y1": 300.65976, "r_x2": 414.03625, "r_y2": 292.13425, "r_x3": 407.97388, "r_y3": 292.13425, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 441.25640999999996, "t": 411.1807600000001, "r": 452.87402, "b": 419.7062700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.25640999999996, "r_y0": 419.7062700000001, "r_x1": 452.87402, "r_y1": 419.7062700000001, "r_x2": 452.87402, "r_y2": 411.1807600000001, "r_x3": 441.25640999999996, "r_y3": 411.1807600000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 393.75256, "t": 399.7947700000001, "r": 432.48929, "b": 406.89935, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 406.89935, "r_x1": 432.48929, "r_y1": 406.89935, "r_x2": 432.48929, "r_y2": 399.7947700000001, "r_x3": 393.75256, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 434.5896000000001, "t": 399.7947700000001, "r": 438.80083999999994, "b": 406.89935, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.5896000000001, "r_y0": 406.89935, "r_x1": 438.80083999999994, "r_y1": 406.89935, "r_x2": 438.80083999999994, "r_y2": 399.7947700000001, "r_x3": 434.5896000000001, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 440.90573, "t": 399.7947700000001, "r": 463.22235, "b": 406.89935, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.90573, "r_y0": 406.89935, "r_x1": 463.22235, "r_y1": 406.89935, "r_x2": 463.22235, "r_y2": 399.7947700000001, "r_x3": 440.90573, "r_y3": 399.7947700000001, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 384.11816, "t": 258.54718, "r": 413.99307, "b": 265.65179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.11816, "r_y0": 265.65179, "r_x1": 413.99307, "r_y1": 265.65179, "r_x2": 413.99307, "r_y2": 258.54718, "r_x3": 384.11816, "r_y3": 258.54718, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 393.75256, "t": 266.67505000000006, "r": 451.45129000000003, "b": 273.77966000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75256, "r_y0": 273.77966000000004, "r_x1": 451.45129000000003, "r_y1": 273.77966000000004, "r_x2": 451.45129000000003, "r_y2": 266.67505000000006, "r_x3": 393.75256, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 453.55083999999994, "t": 266.67505000000006, "r": 461.97485, "b": 273.77966000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55083999999994, "r_y0": 273.77966000000004, "r_x1": 461.97485, "r_y1": 273.77966000000004, "r_x2": 461.97485, "r_y2": 266.67505000000006, "r_x3": 453.55083999999994, "r_y3": 266.67505000000006, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 151.79318, "t": 399.76016, "r": 233.89371000000003, "b": 406.86474999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79318, "r_y0": 406.86474999999996, "r_x1": 233.89371000000003, "r_y1": 406.86474999999996, "r_x2": 233.89371000000003, "r_y2": 399.76016, "r_x3": 151.79318, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 235.99332, "t": 399.76016, "r": 244.41734000000002, "b": 406.86474999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99332, "r_y0": 406.86474999999996, "r_x1": 244.41734000000002, "r_y1": 406.86474999999996, "r_x2": 244.41734000000002, "r_y2": 399.76016, "r_x3": 235.99332, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 246.52222, "t": 399.76016, "r": 268.83884, "b": 406.86474999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52222, "r_y0": 406.86474999999996, "r_x1": 268.83884, "r_y1": 406.86474999999996, "r_x2": 268.83884, "r_y2": 399.76016, "r_x3": 246.52222, "r_y3": 399.76016, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 154.3298, "t": 213.57457999999997, "r": 159.79837, "b": 220.67920000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3298, "r_y0": 220.67920000000004, "r_x1": 159.79837, "r_y1": 220.67920000000004, "r_x2": 159.79837, "r_y2": 213.57457999999997, "r_x3": 154.3298, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 321.07053, "t": 213.57457999999997, "r": 326.53909, "b": 220.67920000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07053, "r_y0": 220.67920000000004, "r_x1": 326.53909, "r_y1": 220.67920000000004, "r_x2": 326.53909, "r_y2": 213.57457999999997, "r_x3": 321.07053, "r_y3": 213.57457999999997, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 153.0947, "t": 280.30411, "r": 175.83888, "b": 286.69824, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 286.69824, "r_x1": 175.83888, "r_y1": 286.69824, "r_x2": 175.83888, "r_y2": 280.30411, "r_x3": 153.0947, "r_y3": 280.30411, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 160.67039, "t": 287.12088, "r": 172.79608, "b": 293.51501, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 293.51501, "r_x1": 172.79608, "r_y1": 293.51501, "r_x2": 172.79608, "r_y2": 287.12088, "r_x3": 160.67039, "r_y3": 287.12088, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 168.24603, "t": 293.93765, "r": 177.91019, "b": 300.33179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 300.33179, "r_x1": 177.91019, "r_y1": 300.33179, "r_x2": 177.91019, "r_y2": 293.93765, "r_x3": 168.24603, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 263.35785, "t": 293.93765, "r": 278.89804, "b": 300.33179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.35785, "r_y0": 300.33179, "r_x1": 278.89804, "r_y1": 300.33179, "r_x2": 278.89804, "r_y2": 293.93765, "r_x3": 263.35785, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 280.79175, "t": 293.93765, "r": 290.4559, "b": 300.33179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79175, "r_y0": 300.33179, "r_x1": 290.4559, "r_y1": 300.33179, "r_x2": 290.4559, "r_y2": 293.93765, "r_x3": 280.79175, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 335.92926, "t": 293.93765, "r": 351.46945, "b": 300.33179, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.92926, "r_y0": 300.33179, "r_x1": 351.46945, "r_y1": 300.33179, "r_x2": 351.46945, "r_y2": 293.93765, "r_x3": 335.92926, "r_y3": 293.93765, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 160.67039, "t": 300.75442999999996, "r": 174.68979, "b": 307.14856, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 307.14856, "r_x1": 174.68979, "r_y1": 307.14856, "r_x2": 174.68979, "r_y2": 300.75442999999996, "r_x3": 160.67039, "r_y3": 300.75442999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 160.67039, "t": 307.57122999999996, "r": 172.79608, "b": 313.96536, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 313.96536, "r_x1": 172.79608, "r_y1": 313.96536, "r_x2": 172.79608, "r_y2": 307.57122999999996, "r_x3": 160.67039, "r_y3": 307.57122999999996, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 168.24603, "t": 314.388, "r": 181.89255, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 320.78214, "r_x1": 181.89255, "r_y1": 320.78214, "r_x2": 181.89255, "r_y2": 314.388, "r_x3": 168.24603, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 201.22015, "t": 314.388, "r": 214.86666999999997, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 320.78214, "r_x1": 214.86666999999997, "r_y1": 320.78214, "r_x2": 214.86666999999997, "r_y2": 314.388, "r_x3": 201.22015, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 234.19427000000002, "t": 314.388, "r": 247.84079000000003, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 320.78214, "r_x1": 247.84079000000003, "r_y1": 320.78214, "r_x2": 247.84079000000003, "r_y2": 314.388, "r_x3": 234.19427000000002, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 160.67039, "t": 321.20477, "r": 174.68979, "b": 327.59890999999993, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 327.59890999999993, "r_x1": 174.68979, "r_y1": 327.59890999999993, "r_x2": 174.68979, "r_y2": 321.20477, "r_x3": 160.67039, "r_y3": 321.20477, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 160.67039, "t": 328.02158, "r": 172.79608, "b": 334.41571000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 334.41571000000005, "r_x1": 172.79608, "r_y1": 334.41571000000005, "r_x2": 172.79608, "r_y2": 328.02158, "r_x3": 160.67039, "r_y3": 328.02158, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 168.24603, "t": 334.83835, "r": 373.09091, "b": 341.23248, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 341.23248, "r_x1": 373.09091, "r_y1": 341.23248, "r_x2": 373.09091, "r_y2": 334.83835, "r_x3": 168.24603, "r_y3": 334.83835, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 160.67039, "t": 341.65512, "r": 174.68979, "b": 348.04926, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 348.04926, "r_x1": 174.68979, "r_y1": 348.04926, "r_x2": 174.68979, "r_y2": 341.65512, "r_x3": 160.67039, "r_y3": 341.65512, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 160.67039, "t": 348.47159, "r": 172.79608, "b": 354.86572, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 354.86572, "r_x1": 172.79608, "r_y1": 354.86572, "r_x2": 172.79608, "r_y2": 348.47159, "r_x3": 160.67039, "r_y3": 348.47159, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 168.24603, "t": 355.28836000000007, "r": 181.89255, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 361.68249999999995, "r_x1": 181.89255, "r_y1": 361.68249999999995, "r_x2": 181.89255, "r_y2": 355.28836000000007, "r_x3": 168.24603, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 201.22015, "t": 355.28836000000007, "r": 214.86666999999997, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 361.68249999999995, "r_x1": 214.86666999999997, "r_y1": 361.68249999999995, "r_x2": 214.86666999999997, "r_y2": 355.28836000000007, "r_x3": 201.22015, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 234.19427000000002, "t": 355.28836000000007, "r": 247.84079000000003, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 361.68249999999995, "r_x1": 247.84079000000003, "r_y1": 361.68249999999995, "r_x2": 247.84079000000003, "r_y2": 355.28836000000007, "r_x3": 234.19427000000002, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 267.1684, "t": 355.28836000000007, "r": 280.81488, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 361.68249999999995, "r_x1": 280.81488, "r_y1": 361.68249999999995, "r_x2": 280.81488, "r_y2": 355.28836000000007, "r_x3": 267.1684, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 160.67039, "t": 362.10516000000007, "r": 174.68979, "b": 368.49929999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 368.49929999999995, "r_x1": 174.68979, "r_y1": 368.49929999999995, "r_x2": 174.68979, "r_y2": 362.10516000000007, "r_x3": 160.67039, "r_y3": 362.10516000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 160.67039, "t": 368.92194, "r": 172.79608, "b": 375.31607, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 375.31607, "r_x1": 172.79608, "r_y1": 375.31607, "r_x2": 172.79608, "r_y2": 368.92194, "r_x3": 160.67039, "r_y3": 368.92194, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 168.24603, "t": 375.73871, "r": 181.89255, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.24603, "r_y0": 382.13284, "r_x1": 181.89255, "r_y1": 382.13284, "r_x2": 181.89255, "r_y2": 375.73871, "r_x3": 168.24603, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 201.22015, "t": 375.73871, "r": 214.86666999999997, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22015, "r_y0": 382.13284, "r_x1": 214.86666999999997, "r_y1": 382.13284, "r_x2": 214.86666999999997, "r_y2": 375.73871, "r_x3": 201.22015, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 234.19427000000002, "t": 375.73871, "r": 247.84079000000003, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19427000000002, "r_y0": 382.13284, "r_x1": 247.84079000000003, "r_y1": 382.13284, "r_x2": 247.84079000000003, "r_y2": 375.73871, "r_x3": 234.19427000000002, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 267.1684, "t": 375.73871, "r": 280.81488, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.1684, "r_y0": 382.13284, "r_x1": 280.81488, "r_y1": 382.13284, "r_x2": 280.81488, "r_y2": 375.73871, "r_x3": 267.1684, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 160.67039, "t": 382.55551, "r": 174.68979, "b": 388.94965, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67039, "r_y0": 388.94965, "r_x1": 174.68979, "r_y1": 388.94965, "r_x2": 174.68979, "r_y2": 382.55551, "r_x3": 160.67039, "r_y3": 382.55551, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 153.0947, "t": 389.37228, "r": 177.73259, "b": 395.76642, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.0947, "r_y0": 395.76642, "r_x1": 177.73259, "r_y1": 395.76642, "r_x2": 177.73259, "r_y2": 389.37228, "r_x3": 153.0947, "r_y3": 389.37228, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.78624, "t": 314.388, "r": 199.32646, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 320.78214, "r_x1": 199.32646, "r_y1": 320.78214, "r_x2": 199.32646, "r_y2": 314.388, "r_x3": 183.78624, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 216.76038, "t": 314.388, "r": 232.30058, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 320.78214, "r_x1": 232.30058, "r_y1": 320.78214, "r_x2": 232.30058, "r_y2": 314.388, "r_x3": 216.76038, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 249.73447999999996, "t": 314.388, "r": 265.27469, "b": 320.78214, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 320.78214, "r_x1": 265.27469, "r_y1": 320.78214, "r_x2": 265.27469, "r_y2": 314.388, "r_x3": 249.73447999999996, "r_y3": 314.388, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 183.78624, "t": 355.28836000000007, "r": 199.32646, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 361.68249999999995, "r_x1": 199.32646, "r_y1": 361.68249999999995, "r_x2": 199.32646, "r_y2": 355.28836000000007, "r_x3": 183.78624, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 216.76038, "t": 355.28836000000007, "r": 232.30058, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 361.68249999999995, "r_x1": 232.30058, "r_y1": 361.68249999999995, "r_x2": 232.30058, "r_y2": 355.28836000000007, "r_x3": 216.76038, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 249.73447999999996, "t": 355.28836000000007, "r": 265.27469, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 361.68249999999995, "r_x1": 265.27469, "r_y1": 361.68249999999995, "r_x2": 265.27469, "r_y2": 355.28836000000007, "r_x3": 249.73447999999996, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 282.70862, "t": 355.28836000000007, "r": 298.24881, "b": 361.68249999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 361.68249999999995, "r_x1": 298.24881, "r_y1": 361.68249999999995, "r_x2": 298.24881, "r_y2": 355.28836000000007, "r_x3": 282.70862, "r_y3": 355.28836000000007, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.78624, "t": 375.73871, "r": 199.32646, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.78624, "r_y0": 382.13284, "r_x1": 199.32646, "r_y1": 382.13284, "r_x2": 199.32646, "r_y2": 375.73871, "r_x3": 183.78624, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 216.76038, "t": 375.73871, "r": 232.30058, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76038, "r_y0": 382.13284, "r_x1": 232.30058, "r_y1": 382.13284, "r_x2": 232.30058, "r_y2": 375.73871, "r_x3": 216.76038, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 249.73447999999996, "t": 375.73871, "r": 265.27469, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73447999999996, "r_y0": 382.13284, "r_x1": 265.27469, "r_y1": 382.13284, "r_x2": 265.27469, "r_y2": 375.73871, "r_x3": 249.73447999999996, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 282.70862, "t": 375.73871, "r": 298.24881, "b": 382.13284, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.70862, "r_y0": 382.13284, "r_x1": 298.24881, "r_y1": 382.13284, "r_x2": 298.24881, "r_y2": 375.73871, "r_x3": 282.70862, "r_y3": 375.73871, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 395.06137, "t": 411.33353, "r": 401.62366, "b": 419.85904, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06137, "r_y0": 419.85904, "r_x1": 401.62366, "r_y1": 419.85904, "r_x2": 401.62366, "r_y2": 411.33353, "r_x3": 395.06137, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 407.42249, "t": 411.33353, "r": 412.47598, "b": 419.85904, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42249, "r_y0": 419.85904, "r_x1": 412.47598, "r_y1": 419.85904, "r_x2": 412.47598, "r_y2": 411.33353, "r_x3": 407.42249, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 418.69287, "t": 411.33353, "r": 425.25516, "b": 419.85904, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69287, "r_y0": 419.85904, "r_x1": 425.25516, "r_y1": 419.85904, "r_x2": 425.25516, "r_y2": 411.33353, "r_x3": 418.69287, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 430.5086099999999, "t": 411.33353, "r": 436.5709800000001, "b": 419.85904, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5086099999999, "r_y0": 419.85904, "r_x1": 436.5709800000001, "r_y1": 419.85904, "r_x2": 436.5709800000001, "r_y2": 411.33353, "r_x3": 430.5086099999999, "r_y3": 411.33353, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 152.36208, "t": 409.77362, "r": 175.10626, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36208, "r_y0": 416.16776, "r_x1": 175.10626, "r_y1": 416.16776, "r_x2": 175.10626, "r_y2": 409.77362, "r_x3": 152.36208, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 178.89366, "t": 409.77362, "r": 191.01935, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89366, "r_y0": 416.16776, "r_x1": 191.01935, "r_y1": 416.16776, "r_x2": 191.01935, "r_y2": 409.77362, "r_x3": 178.89366, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 194.80676, "t": 409.77362, "r": 208.82614, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.80676, "r_y0": 416.16776, "r_x1": 208.82614, "r_y1": 416.16776, "r_x2": 208.82614, "r_y2": 409.77362, "r_x3": 194.80676, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 212.61354, "t": 409.77362, "r": 226.26003999999998, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61354, "r_y0": 416.16776, "r_x1": 226.26003999999998, "r_y1": 416.16776, "r_x2": 226.26003999999998, "r_y2": 409.77362, "r_x3": 212.61354, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 249.37506000000002, "t": 409.77362, "r": 259.03918, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.37506000000002, "r_y0": 416.16776, "r_x1": 259.03918, "r_y1": 416.16776, "r_x2": 259.03918, "r_y2": 409.77362, "r_x3": 249.37506000000002, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 244.46358, "t": 418.10522, "r": 269.10144, "b": 424.49936, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46358, "r_y0": 424.49936, "r_x1": 269.10144, "r_y1": 424.49936, "r_x2": 269.10144, "r_y2": 418.10522, "r_x3": 244.46358, "r_y3": 418.10522, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 230.04745000000003, "t": 409.77362, "r": 245.58765000000002, "b": 416.16776, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.04745000000003, "r_y0": 416.16776, "r_x1": 245.58765000000002, "r_y1": 416.16776, "r_x2": 245.58765000000002, "r_y2": 409.77362, "r_x3": 230.04745000000003, "r_y3": 409.77362, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 154.50595, "t": 258.60095, "r": 159.62473, "b": 265.70556999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.50595, "r_y0": 265.70556999999997, "r_x1": 159.62473, "r_y1": 265.70556999999997, "r_x2": 159.62473, "r_y2": 258.60095, "r_x3": 154.50595, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 164.74348, "t": 258.60095, "r": 185.21857, "b": 265.70556999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74348, "r_y0": 265.70556999999997, "r_x1": 185.21857, "r_y1": 265.70556999999997, "r_x2": 185.21857, "r_y2": 258.60095, "r_x3": 164.74348, "r_y3": 258.60095, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 164.3548, "t": 266.49707, "r": 222.05352999999997, "b": 273.60168, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.3548, "r_y0": 273.60168, "r_x1": 222.05352999999997, "r_y1": 273.60168, "r_x2": 222.05352999999997, "r_y2": 266.49707, "r_x3": 164.3548, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 224.15326, "t": 266.49707, "r": 232.57729, "b": 273.60168, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15326, "r_y0": 273.60168, "r_x1": 232.57729, "r_y1": 273.60168, "r_x2": 232.57729, "r_y2": 266.49707, "r_x3": 224.15326, "r_y3": 266.49707, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 2, "page_no": 1, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.765, "t": 452.31378, "r": 480.59232000000003, "b": 520.88669, "coord_origin": "TOPLEFT" }, "confidence": 0.950499951839447, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 461.11075, "r_x1": 161.32928, "r_y1": 461.11075, "r_x2": 161.32928, "r_y2": 452.31378, "r_x3": 134.765, "r_y3": 452.31378, "coord_origin": "TOPLEFT" }, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.269, "r_y0": 461.11075, "r_x1": 226.28617999999997, "r_y1": 461.11075, "r_x2": 226.28617999999997, "r_y2": 452.31378, "r_x3": 164.269, "r_y3": 452.31378, "coord_origin": "TOPLEFT" }, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.992, "r_y0": 461.11075, "r_x1": 480.59232000000003, "r_y1": 461.11075, "r_x2": 480.59232000000003, "r_y2": 452.31378, "r_x3": 229.992, "r_y3": 452.31378, "coord_origin": "TOPLEFT" }, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 473.06573, "r_x1": 480.59180000000003, "r_y1": 473.06573, "r_x2": 480.59180000000003, "r_y2": 464.26877, "r_x3": 134.76501, "r_y3": 464.26877, "coord_origin": "TOPLEFT" }, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 485.02072, "r_x1": 480.58673, "r_y1": 485.02072, "r_x2": 480.58673, "r_y2": 476.22375, "r_x3": 134.76501, "r_y3": 476.22375, "coord_origin": "TOPLEFT" }, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 496.97672, "r_x1": 480.58658, "r_y1": 496.97672, "r_x2": 480.58658, "r_y2": 488.17975, "r_x3": 134.76501, "r_y3": 488.17975, "coord_origin": "TOPLEFT" }, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 508.9317, "r_x1": 480.58978, "r_y1": 508.9317, "r_x2": 480.58978, "r_y2": 500.13474, "r_x3": 134.76501, "r_y3": 500.13474, "coord_origin": "TOPLEFT" }, "text": "area of research, in which many novel machine learning algorithms are being", "orig": "area of research, in which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 520.88669, "r_x1": 313.24597, "r_y1": 520.88669, "r_x2": 313.24597, "r_y2": 512.0897199999999, "r_x3": 134.76501, "r_y3": 512.0897199999999, "coord_origin": "TOPLEFT" }, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "today, table detection in documents is a well understood problem, and the latest state-of-the-art (SOTA) object detection methods provide an accuracy comparable to human observers [7,8,10,14,23]. On the other hand, the problem of table structure recognition (TSR) is a lot more challenging and remains a very active area of research, in which many novel machine learning algorithms are being explored [3,4,5,9,11,12,13,14,17,18,21,22]." }, { "label": "text", "id": 0, "page_no": 1, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76501, "t": 524.55072, "r": 480.59482, "b": 664.8547, "coord_origin": "TOPLEFT" }, "confidence": 0.9845512509346008, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70901, "r_y0": 533.3476900000001, "r_x1": 480.58884000000006, "r_y1": 533.3476900000001, "r_x2": 480.58884000000006, "r_y2": 524.55072, "r_x3": 149.70901, "r_y3": 524.55072, "coord_origin": "TOPLEFT" }, "text": "Recently emerging SOTA methods for table structure recognition employ", "orig": "Recently emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 545.30368, "r_x1": 480.5917400000001, "r_y1": 545.30368, "r_x2": 480.5917400000001, "r_y2": 536.50671, "r_x3": 134.76501, "r_y3": 536.50671, "coord_origin": "TOPLEFT" }, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 557.25868, "r_x1": 480.58868, "r_y1": 557.25868, "r_x2": 480.58868, "r_y2": 548.46172, "r_x3": 134.76501, "r_y3": 548.46172, "coord_origin": "TOPLEFT" }, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 569.2136800000001, "r_x1": 480.58795, "r_y1": 569.2136800000001, "r_x2": 480.58795, "r_y2": 560.41672, "r_x3": 134.76501, "r_y3": 560.41672, "coord_origin": "TOPLEFT" }, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 581.16869, "r_x1": 480.58978, "r_y1": 581.16869, "r_x2": 480.58978, "r_y2": 572.37172, "r_x3": 134.76501, "r_y3": 572.37172, "coord_origin": "TOPLEFT" }, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 593.12369, "r_x1": 480.59479, "r_y1": 593.12369, "r_x2": 480.59479, "r_y2": 584.32672, "r_x3": 134.76501, "r_y3": 584.32672, "coord_origin": "TOPLEFT" }, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 605.0796799999999, "r_x1": 480.58678999999995, "r_y1": 605.0796799999999, "r_x2": 480.58678999999995, "r_y2": 596.28271, "r_x3": 134.76501, "r_y3": 596.28271, "coord_origin": "TOPLEFT" }, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 617.03468, "r_x1": 480.59476, "r_y1": 617.03468, "r_x2": 480.59476, "r_y2": 608.23772, "r_x3": 134.76501, "r_y3": 608.23772, "coord_origin": "TOPLEFT" }, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 628.98969, "r_x1": 480.5938100000001, "r_y1": 628.98969, "r_x2": 480.5938100000001, "r_y2": 620.19272, "r_x3": 134.76501, "r_y3": 620.19272, "coord_origin": "TOPLEFT" }, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 640.94469, "r_x1": 480.59482, "r_y1": 640.94469, "r_x2": 480.59482, "r_y2": 632.1477199999999, "r_x3": 134.76501, "r_y3": 632.1477199999999, "coord_origin": "TOPLEFT" }, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 652.89969, "r_x1": 480.58771, "r_y1": 652.89969, "r_x2": 480.58771, "r_y2": 644.10272, "r_x3": 134.76501, "r_y3": 644.10272, "coord_origin": "TOPLEFT" }, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 664.8547, "r_x1": 421.45377, "r_y1": 664.8547, "r_x2": 421.45377, "r_y2": 656.05772, "r_x3": 134.76501, "r_y3": 656.05772, "coord_origin": "TOPLEFT" }, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Recently emerging SOTA methods for table structure recognition employ transformer-based models, in which an image of the table is provided to the network in order to predict the structure of the table as a sequence of tokens. These image-to-sequence (Im2Seq) models are extremely powerful, since they allow for a purely data-driven solution. The tokens of the sequence typically belong to a markup language such as HTML, Latex or Markdown, which allow to describe table structure as rows, columns and spanning cells in various configurations. In Figure 1, we illustrate how HTML is used to represent the table-structure of a particular example table. Public table-structure data sets such as PubTabNet [22], and FinTabNet [21], which were created in a semi-automated way from paired PDF and HTML sources (e.g. PubMed Central), popularized primarily the use of HTML as ground-truth representation format for TSR." } ], "headers": [ { "label": "page_header", "id": 5, "page_no": 1, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 139.37193, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8580349683761597, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2" }, { "label": "page_header", "id": 3, "page_no": 1, "cluster": { "id": 3, "label": "page_header", "bbox": { "l": 167.81335, "t": 93.77099999999996, "r": 231.72227, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9076642990112305, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 2, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 127.73077, "r_x1": 480.59183, "r_y1": 127.73077, "r_x2": 480.59183, "r_y2": 118.93377999999996, "r_x3": 149.709, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 480.58675999999997, "r_y1": 139.68579, "r_x2": 480.58675999999997, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 151.64178000000004, "r_x1": 480.5917400000001, "r_y1": 151.64178000000004, "r_x2": 480.5917400000001, "r_y2": 142.84479, "r_x3": 134.765, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 163.59680000000003, "r_x1": 169.62514, "r_y1": 163.59680000000003, "r_x2": 169.62514, "r_y2": 154.7998, "r_x3": 134.765, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.86099, "r_y0": 163.59680000000003, "r_x1": 194.55531, "r_y1": 163.59680000000003, "r_x2": 194.55531, "r_y2": 154.7998, "r_x3": 173.86099, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.60999, "r_y0": 163.59680000000003, "r_x1": 480.58618, "r_y1": 163.59680000000003, "r_x2": 480.58618, "r_y2": 154.7998, "r_x3": 199.60999, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "for the sequence tokenization in Im2Seq models. In this paper,", "orig": "for the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 175.55182000000002, "r_x1": 480.59167, "r_y1": 175.55182000000002, "r_x2": 480.59167, "r_y2": 166.75482, "r_x3": 134.76498, "r_y3": 166.75482, "coord_origin": "TOPLEFT" }, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 187.50684, "r_x1": 480.58968999999996, "r_y1": 187.50684, "r_x2": 480.58968999999996, "r_y2": 178.70983999999999, "r_x3": 134.76498, "r_y3": 178.70983999999999, "coord_origin": "TOPLEFT" }, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 199.46185000000003, "r_x1": 480.5917400000001, "r_y1": 199.46185000000003, "r_x2": 480.5917400000001, "r_y2": 190.66485999999998, "r_x3": 134.76498, "r_y3": 190.66485999999998, "coord_origin": "TOPLEFT" }, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 211.41687000000002, "r_x1": 348.35519, "r_y1": 211.41687000000002, "r_x2": 348.35519, "r_y2": 202.61987, "r_x3": 134.76498, "r_y3": 202.61987, "coord_origin": "TOPLEFT" }, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 223.63287000000003, "r_x1": 480.5939, "r_y1": 223.63287000000003, "r_x2": 480.5939, "r_y2": 214.83587999999997, "r_x3": 149.70898, "r_y3": 214.83587999999997, "coord_origin": "TOPLEFT" }, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 235.58789000000002, "r_x1": 480.5938100000001, "r_y1": 235.58789000000002, "r_x2": 480.5938100000001, "r_y2": 226.79089, "r_x3": 134.76498, "r_y3": 226.79089, "coord_origin": "TOPLEFT" }, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 247.54387999999994, "r_x1": 480.58667, "r_y1": 247.54387999999994, "r_x2": 480.58667, "r_y2": 238.74689, "r_x3": 134.76498, "r_y3": 238.74689, "coord_origin": "TOPLEFT" }, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 259.49890000000005, "r_x1": 480.5867, "r_y1": 259.49890000000005, "r_x2": 480.5867, "r_y2": 250.70190000000002, "r_x3": 134.76498, "r_y3": 250.70190000000002, "coord_origin": "TOPLEFT" }, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 271.45392000000004, "r_x1": 480.58771, "r_y1": 271.45392000000004, "r_x2": 480.58771, "r_y2": 262.65692, "r_x3": 134.76498, "r_y3": 262.65692, "coord_origin": "TOPLEFT" }, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 283.40891, "r_x1": 480.59572999999995, "r_y1": 283.40891, "r_x2": 480.59572999999995, "r_y2": 274.61194, "r_x3": 134.76498, "r_y3": 274.61194, "coord_origin": "TOPLEFT" }, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 295.36389, "r_x1": 480.59274, "r_y1": 295.36389, "r_x2": 480.59274, "r_y2": 286.56692999999996, "r_x3": 134.76498, "r_y3": 286.56692999999996, "coord_origin": "TOPLEFT" }, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 307.31888, "r_x1": 480.59473, "r_y1": 307.31888, "r_x2": 480.59473, "r_y2": 298.52190999999993, "r_x3": 134.76498, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 319.27487, "r_x1": 480.58667, "r_y1": 319.27487, "r_x2": 480.58667, "r_y2": 310.47791, "r_x3": 134.76498, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 331.22986, "r_x1": 179.72021, "r_y1": 331.22986, "r_x2": 179.72021, "r_y2": 322.43289, "r_x3": 134.76498, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 343.44485000000003, "r_x1": 480.5878000000001, "r_y1": 343.44485000000003, "r_x2": 480.5878000000001, "r_y2": 334.64789, "r_x3": 149.70898, "r_y3": 334.64789, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 355.40085, "r_x1": 480.59375, "r_y1": 355.40085, "r_x2": 480.59375, "r_y2": 346.60388000000006, "r_x3": 134.76498, "r_y3": 346.60388000000006, "coord_origin": "TOPLEFT" }, "text": "latest developments in table-structure reconstruction. In section 3 we review", "orig": "latest developments in table-structure reconstruction. In section 3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 367.3558300000001, "r_x1": 480.58673, "r_y1": 367.3558300000001, "r_x2": 480.58673, "r_y2": 358.55887, "r_x3": 134.76498, "r_y3": 358.55887, "coord_origin": "TOPLEFT" }, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 379.31082, "r_x1": 480.59161, "r_y1": 379.31082, "r_x2": 480.59161, "r_y2": 370.51385, "r_x3": 134.76498, "r_y3": 370.51385, "coord_origin": "TOPLEFT" }, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 391.26581, "r_x1": 480.59177000000005, "r_y1": 391.26581, "r_x2": 480.59177000000005, "r_y2": 382.46883999999994, "r_x3": 134.76498, "r_y3": 382.46883999999994, "coord_origin": "TOPLEFT" }, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 403.2207900000001, "r_x1": 480.58774, "r_y1": 403.2207900000001, "r_x2": 480.58774, "r_y2": 394.42383, "r_x3": 134.76498, "r_y3": 394.42383, "coord_origin": "TOPLEFT" }, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 415.17679, "r_x1": 480.59469999999993, "r_y1": 415.17679, "r_x2": 480.59469999999993, "r_y2": 406.37982, "r_x3": 134.76498, "r_y3": 406.37982, "coord_origin": "TOPLEFT" }, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 427.13177, "r_x1": 480.59567, "r_y1": 427.13177, "r_x2": 480.59567, "r_y2": 418.33481, "r_x3": 134.76498, "r_y3": 418.33481, "coord_origin": "TOPLEFT" }, "text": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "orig": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 439.08676, "r_x1": 201.27232, "r_y1": 439.08676, "r_x2": 201.27232, "r_y2": 430.28979, "r_x3": 134.76498, "r_y3": 430.28979, "coord_origin": "TOPLEFT" }, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 472.65634, "r_x1": 141.48859, "r_y1": 472.65634, "r_x2": 141.48859, "r_y2": 462.08795, "r_x3": 134.76498, "r_y3": 462.08795, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93819, "r_y0": 472.65634, "r_x1": 236.76912999999996, "r_y1": 472.65634, "r_x2": 236.76912999999996, "r_y2": 462.08795, "r_x3": 154.93819, "r_y3": 462.08795, "coord_origin": "TOPLEFT" }, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 497.48279, "r_x1": 480.59067, "r_y1": 497.48279, "r_x2": 480.59067, "r_y2": 488.68582, "r_x3": 134.76498, "r_y3": 488.68582, "coord_origin": "TOPLEFT" }, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 509.43777, "r_x1": 480.5917400000001, "r_y1": 509.43777, "r_x2": 480.5917400000001, "r_y2": 500.64081, "r_x3": 134.76498, "r_y3": 500.64081, "coord_origin": "TOPLEFT" }, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 521.39276, "r_x1": 480.58971999999994, "r_y1": 521.39276, "r_x2": 480.58971999999994, "r_y2": 512.5957900000001, "r_x3": 134.76498, "r_y3": 512.5957900000001, "coord_origin": "TOPLEFT" }, "text": "variety of computer vision methods have been explored to tackle the prob-", "orig": "variety of computer vision methods have been explored to tackle the prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 533.34875, "r_x1": 480.58966, "r_y1": 533.34875, "r_x2": 480.58966, "r_y2": 524.55179, "r_x3": 134.76498, "r_y3": 524.55179, "coord_origin": "TOPLEFT" }, "text": "lem of table structure recognition, i.e. the correct identification of columns,", "orig": "lem of table structure recognition, i.e. the correct identification of columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 545.30376, "r_x1": 480.5897499999999, "r_y1": 545.30376, "r_x2": 480.5897499999999, "r_y2": 536.50679, "r_x3": 134.76498, "r_y3": 536.50679, "coord_origin": "TOPLEFT" }, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 557.2587599999999, "r_x1": 480.58862000000005, "r_y1": 557.2587599999999, "r_x2": 480.58862000000005, "r_y2": 548.4617900000001, "r_x3": 134.76498, "r_y3": 548.4617900000001, "coord_origin": "TOPLEFT" }, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 569.21376, "r_x1": 480.59072999999995, "r_y1": 569.21376, "r_x2": 480.59072999999995, "r_y2": 560.41679, "r_x3": 134.76498, "r_y3": 560.41679, "coord_origin": "TOPLEFT" }, "text": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "orig": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 581.16876, "r_x1": 484.12047999999993, "r_y1": 581.16876, "r_x2": 484.12047999999993, "r_y2": 572.3718, "r_x3": 134.76498, "r_y3": 572.3718, "coord_origin": "TOPLEFT" }, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 593.12376, "r_x1": 480.59567, "r_y1": 593.12376, "r_x2": 480.59567, "r_y2": 584.3267999999999, "r_x3": 134.76498, "r_y3": 584.3267999999999, "coord_origin": "TOPLEFT" }, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 605.07976, "r_x1": 480.58871, "r_y1": 605.07976, "r_x2": 480.58871, "r_y2": 596.28279, "r_x3": 134.76498, "r_y3": 596.28279, "coord_origin": "TOPLEFT" }, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 617.03476, "r_x1": 480.59075999999993, "r_y1": 617.03476, "r_x2": 480.59075999999993, "r_y2": 608.23779, "r_x3": 134.76498, "r_y3": 608.23779, "coord_origin": "TOPLEFT" }, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 628.9897599999999, "r_x1": 480.58574999999996, "r_y1": 628.9897599999999, "r_x2": 480.58574999999996, "r_y2": 620.1927900000001, "r_x3": 134.76498, "r_y3": 620.1927900000001, "coord_origin": "TOPLEFT" }, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 640.94476, "r_x1": 480.58875, "r_y1": 640.94476, "r_x2": 480.58875, "r_y2": 632.1478, "r_x3": 134.76498, "r_y3": 632.1478, "coord_origin": "TOPLEFT" }, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 652.89977, "r_x1": 480.58875, "r_y1": 652.89977, "r_x2": 480.58875, "r_y2": 644.1028, "r_x3": 134.76498, "r_y3": 644.1028, "coord_origin": "TOPLEFT" }, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 664.85577, "r_x1": 480.59069999999997, "r_y1": 664.85577, "r_x2": 480.59069999999997, "r_y2": 656.05879, "r_x3": 134.76498, "r_y3": 656.05879, "coord_origin": "TOPLEFT" }, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9325801730155945, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 475.98431, "t": 93.77099999999996, "r": 480.59125000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8773486614227295, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.76498, "t": 118.93377999999996, "r": 480.59183, "b": 211.41687000000002, "coord_origin": "TOPLEFT" }, "confidence": 0.9871802926063538, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 127.73077, "r_x1": 480.59183, "r_y1": 127.73077, "r_x2": 480.59183, "r_y2": 118.93377999999996, "r_x3": 149.709, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 480.58675999999997, "r_y1": 139.68579, "r_x2": 480.58675999999997, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 151.64178000000004, "r_x1": 480.5917400000001, "r_y1": 151.64178000000004, "r_x2": 480.5917400000001, "r_y2": 142.84479, "r_x3": 134.765, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 163.59680000000003, "r_x1": 169.62514, "r_y1": 163.59680000000003, "r_x2": 169.62514, "r_y2": 154.7998, "r_x3": 134.765, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.86099, "r_y0": 163.59680000000003, "r_x1": 194.55531, "r_y1": 163.59680000000003, "r_x2": 194.55531, "r_y2": 154.7998, "r_x3": 173.86099, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.60999, "r_y0": 163.59680000000003, "r_x1": 480.58618, "r_y1": 163.59680000000003, "r_x2": 480.58618, "r_y2": 154.7998, "r_x3": 199.60999, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "for the sequence tokenization in Im2Seq models. In this paper,", "orig": "for the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 175.55182000000002, "r_x1": 480.59167, "r_y1": 175.55182000000002, "r_x2": 480.59167, "r_y2": 166.75482, "r_x3": 134.76498, "r_y3": 166.75482, "coord_origin": "TOPLEFT" }, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 187.50684, "r_x1": 480.58968999999996, "r_y1": 187.50684, "r_x2": 480.58968999999996, "r_y2": 178.70983999999999, "r_x3": 134.76498, "r_y3": 178.70983999999999, "coord_origin": "TOPLEFT" }, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 199.46185000000003, "r_x1": 480.5917400000001, "r_y1": 199.46185000000003, "r_x2": 480.5917400000001, "r_y2": 190.66485999999998, "r_x3": 134.76498, "r_y3": 190.66485999999998, "coord_origin": "TOPLEFT" }, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 211.41687000000002, "r_x1": 348.35519, "r_y1": 211.41687000000002, "r_x2": 348.35519, "r_y2": 202.61987, "r_x3": 134.76498, "r_y3": 202.61987, "coord_origin": "TOPLEFT" }, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.76498, "t": 214.83587999999997, "r": 480.59572999999995, "b": 331.22986, "coord_origin": "TOPLEFT" }, "confidence": 0.9871861338615417, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 223.63287000000003, "r_x1": 480.5939, "r_y1": 223.63287000000003, "r_x2": 480.5939, "r_y2": 214.83587999999997, "r_x3": 149.70898, "r_y3": 214.83587999999997, "coord_origin": "TOPLEFT" }, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 235.58789000000002, "r_x1": 480.5938100000001, "r_y1": 235.58789000000002, "r_x2": 480.5938100000001, "r_y2": 226.79089, "r_x3": 134.76498, "r_y3": 226.79089, "coord_origin": "TOPLEFT" }, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 247.54387999999994, "r_x1": 480.58667, "r_y1": 247.54387999999994, "r_x2": 480.58667, "r_y2": 238.74689, "r_x3": 134.76498, "r_y3": 238.74689, "coord_origin": "TOPLEFT" }, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 259.49890000000005, "r_x1": 480.5867, "r_y1": 259.49890000000005, "r_x2": 480.5867, "r_y2": 250.70190000000002, "r_x3": 134.76498, "r_y3": 250.70190000000002, "coord_origin": "TOPLEFT" }, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 271.45392000000004, "r_x1": 480.58771, "r_y1": 271.45392000000004, "r_x2": 480.58771, "r_y2": 262.65692, "r_x3": 134.76498, "r_y3": 262.65692, "coord_origin": "TOPLEFT" }, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 283.40891, "r_x1": 480.59572999999995, "r_y1": 283.40891, "r_x2": 480.59572999999995, "r_y2": 274.61194, "r_x3": 134.76498, "r_y3": 274.61194, "coord_origin": "TOPLEFT" }, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 295.36389, "r_x1": 480.59274, "r_y1": 295.36389, "r_x2": 480.59274, "r_y2": 286.56692999999996, "r_x3": 134.76498, "r_y3": 286.56692999999996, "coord_origin": "TOPLEFT" }, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 307.31888, "r_x1": 480.59473, "r_y1": 307.31888, "r_x2": 480.59473, "r_y2": 298.52190999999993, "r_x3": 134.76498, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 319.27487, "r_x1": 480.58667, "r_y1": 319.27487, "r_x2": 480.58667, "r_y2": 310.47791, "r_x3": 134.76498, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 331.22986, "r_x1": 179.72021, "r_y1": 331.22986, "r_x2": 179.72021, "r_y2": 322.43289, "r_x3": 134.76498, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.76498, "t": 334.64789, "r": 480.59567, "b": 439.08676, "coord_origin": "TOPLEFT" }, "confidence": 0.988121747970581, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 343.44485000000003, "r_x1": 480.5878000000001, "r_y1": 343.44485000000003, "r_x2": 480.5878000000001, "r_y2": 334.64789, "r_x3": 149.70898, "r_y3": 334.64789, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 355.40085, "r_x1": 480.59375, "r_y1": 355.40085, "r_x2": 480.59375, "r_y2": 346.60388000000006, "r_x3": 134.76498, "r_y3": 346.60388000000006, "coord_origin": "TOPLEFT" }, "text": "latest developments in table-structure reconstruction. In section 3 we review", "orig": "latest developments in table-structure reconstruction. In section 3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 367.3558300000001, "r_x1": 480.58673, "r_y1": 367.3558300000001, "r_x2": 480.58673, "r_y2": 358.55887, "r_x3": 134.76498, "r_y3": 358.55887, "coord_origin": "TOPLEFT" }, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 379.31082, "r_x1": 480.59161, "r_y1": 379.31082, "r_x2": 480.59161, "r_y2": 370.51385, "r_x3": 134.76498, "r_y3": 370.51385, "coord_origin": "TOPLEFT" }, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 391.26581, "r_x1": 480.59177000000005, "r_y1": 391.26581, "r_x2": 480.59177000000005, "r_y2": 382.46883999999994, "r_x3": 134.76498, "r_y3": 382.46883999999994, "coord_origin": "TOPLEFT" }, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 403.2207900000001, "r_x1": 480.58774, "r_y1": 403.2207900000001, "r_x2": 480.58774, "r_y2": 394.42383, "r_x3": 134.76498, "r_y3": 394.42383, "coord_origin": "TOPLEFT" }, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 415.17679, "r_x1": 480.59469999999993, "r_y1": 415.17679, "r_x2": 480.59469999999993, "r_y2": 406.37982, "r_x3": 134.76498, "r_y3": 406.37982, "coord_origin": "TOPLEFT" }, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 427.13177, "r_x1": 480.59567, "r_y1": 427.13177, "r_x2": 480.59567, "r_y2": 418.33481, "r_x3": 134.76498, "r_y3": 418.33481, "coord_origin": "TOPLEFT" }, "text": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "orig": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 439.08676, "r_x1": 201.27232, "r_y1": 439.08676, "r_x2": 201.27232, "r_y2": 430.28979, "r_x3": 134.76498, "r_y3": 430.28979, "coord_origin": "TOPLEFT" }, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "section_header", "bbox": { "l": 134.76498, "t": 462.08795, "r": 236.76912999999996, "b": 472.65634, "coord_origin": "TOPLEFT" }, "confidence": 0.9439423680305481, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 472.65634, "r_x1": 141.48859, "r_y1": 472.65634, "r_x2": 141.48859, "r_y2": 462.08795, "r_x3": 134.76498, "r_y3": 462.08795, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93819, "r_y0": 472.65634, "r_x1": 236.76912999999996, "r_y1": 472.65634, "r_x2": 236.76912999999996, "r_y2": 462.08795, "r_x3": 154.93819, "r_y3": 462.08795, "coord_origin": "TOPLEFT" }, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 134.76498, "t": 488.68582, "r": 484.12047999999993, "b": 664.85577, "coord_origin": "TOPLEFT" }, "confidence": 0.9870182871818542, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 497.48279, "r_x1": 480.59067, "r_y1": 497.48279, "r_x2": 480.59067, "r_y2": 488.68582, "r_x3": 134.76498, "r_y3": 488.68582, "coord_origin": "TOPLEFT" }, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 509.43777, "r_x1": 480.5917400000001, "r_y1": 509.43777, "r_x2": 480.5917400000001, "r_y2": 500.64081, "r_x3": 134.76498, "r_y3": 500.64081, "coord_origin": "TOPLEFT" }, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 521.39276, "r_x1": 480.58971999999994, "r_y1": 521.39276, "r_x2": 480.58971999999994, "r_y2": 512.5957900000001, "r_x3": 134.76498, "r_y3": 512.5957900000001, "coord_origin": "TOPLEFT" }, "text": "variety of computer vision methods have been explored to tackle the prob-", "orig": "variety of computer vision methods have been explored to tackle the prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 533.34875, "r_x1": 480.58966, "r_y1": 533.34875, "r_x2": 480.58966, "r_y2": 524.55179, "r_x3": 134.76498, "r_y3": 524.55179, "coord_origin": "TOPLEFT" }, "text": "lem of table structure recognition, i.e. the correct identification of columns,", "orig": "lem of table structure recognition, i.e. the correct identification of columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 545.30376, "r_x1": 480.5897499999999, "r_y1": 545.30376, "r_x2": 480.5897499999999, "r_y2": 536.50679, "r_x3": 134.76498, "r_y3": 536.50679, "coord_origin": "TOPLEFT" }, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 557.2587599999999, "r_x1": 480.58862000000005, "r_y1": 557.2587599999999, "r_x2": 480.58862000000005, "r_y2": 548.4617900000001, "r_x3": 134.76498, "r_y3": 548.4617900000001, "coord_origin": "TOPLEFT" }, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 569.21376, "r_x1": 480.59072999999995, "r_y1": 569.21376, "r_x2": 480.59072999999995, "r_y2": 560.41679, "r_x3": 134.76498, "r_y3": 560.41679, "coord_origin": "TOPLEFT" }, "text": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "orig": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 581.16876, "r_x1": 484.12047999999993, "r_y1": 581.16876, "r_x2": 484.12047999999993, "r_y2": 572.3718, "r_x3": 134.76498, "r_y3": 572.3718, "coord_origin": "TOPLEFT" }, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 593.12376, "r_x1": 480.59567, "r_y1": 593.12376, "r_x2": 480.59567, "r_y2": 584.3267999999999, "r_x3": 134.76498, "r_y3": 584.3267999999999, "coord_origin": "TOPLEFT" }, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 605.07976, "r_x1": 480.58871, "r_y1": 605.07976, "r_x2": 480.58871, "r_y2": 596.28279, "r_x3": 134.76498, "r_y3": 596.28279, "coord_origin": "TOPLEFT" }, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 617.03476, "r_x1": 480.59075999999993, "r_y1": 617.03476, "r_x2": 480.59075999999993, "r_y2": 608.23779, "r_x3": 134.76498, "r_y3": 608.23779, "coord_origin": "TOPLEFT" }, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 628.9897599999999, "r_x1": 480.58574999999996, "r_y1": 628.9897599999999, "r_x2": 480.58574999999996, "r_y2": 620.1927900000001, "r_x3": 134.76498, "r_y3": 620.1927900000001, "coord_origin": "TOPLEFT" }, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 640.94476, "r_x1": 480.58875, "r_y1": 640.94476, "r_x2": 480.58875, "r_y2": 632.1478, "r_x3": 134.76498, "r_y3": 632.1478, "coord_origin": "TOPLEFT" }, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 652.89977, "r_x1": 480.58875, "r_y1": 652.89977, "r_x2": 480.58875, "r_y2": 644.1028, "r_x3": 134.76498, "r_y3": 644.1028, "coord_origin": "TOPLEFT" }, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 664.85577, "r_x1": 480.59069999999997, "r_y1": 664.85577, "r_x2": 480.59069999999997, "r_y2": 656.05879, "r_x3": 134.76498, "r_y3": 656.05879, "coord_origin": "TOPLEFT" }, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 5, "page_no": 2, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9325801730155945, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 6, "page_no": 2, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 475.98431, "t": 93.77099999999996, "r": 480.59125000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8773486614227295, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3" }, { "label": "text", "id": 2, "page_no": 2, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76498, "t": 118.93377999999996, "r": 480.59183, "b": 211.41687000000002, "coord_origin": "TOPLEFT" }, "confidence": 0.9871802926063538, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 127.73077, "r_x1": 480.59183, "r_y1": 127.73077, "r_x2": 480.59183, "r_y2": 118.93377999999996, "r_x3": 149.709, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 480.58675999999997, "r_y1": 139.68579, "r_x2": 480.58675999999997, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 151.64178000000004, "r_x1": 480.5917400000001, "r_y1": 151.64178000000004, "r_x2": 480.5917400000001, "r_y2": 142.84479, "r_x3": 134.765, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 163.59680000000003, "r_x1": 169.62514, "r_y1": 163.59680000000003, "r_x2": 169.62514, "r_y2": 154.7998, "r_x3": 134.765, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.86099, "r_y0": 163.59680000000003, "r_x1": 194.55531, "r_y1": 163.59680000000003, "r_x2": 194.55531, "r_y2": 154.7998, "r_x3": 173.86099, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.60999, "r_y0": 163.59680000000003, "r_x1": 480.58618, "r_y1": 163.59680000000003, "r_x2": 480.58618, "r_y2": 154.7998, "r_x3": 199.60999, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "for the sequence tokenization in Im2Seq models. In this paper,", "orig": "for the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 175.55182000000002, "r_x1": 480.59167, "r_y1": 175.55182000000002, "r_x2": 480.59167, "r_y2": 166.75482, "r_x3": 134.76498, "r_y3": 166.75482, "coord_origin": "TOPLEFT" }, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 187.50684, "r_x1": 480.58968999999996, "r_y1": 187.50684, "r_x2": 480.58968999999996, "r_y2": 178.70983999999999, "r_x3": 134.76498, "r_y3": 178.70983999999999, "coord_origin": "TOPLEFT" }, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 199.46185000000003, "r_x1": 480.5917400000001, "r_y1": 199.46185000000003, "r_x2": 480.5917400000001, "r_y2": 190.66485999999998, "r_x3": 134.76498, "r_y3": 190.66485999999998, "coord_origin": "TOPLEFT" }, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 211.41687000000002, "r_x1": 348.35519, "r_y1": 211.41687000000002, "r_x2": 348.35519, "r_y2": 202.61987, "r_x3": 134.76498, "r_y3": 202.61987, "coord_origin": "TOPLEFT" }, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "While the majority of research in TSR is currently focused on the development and application of novel neural model architectures, the table structure representation language (e.g. HTML in PubTabNet and FinTabNet) is usually adopted as is for the sequence tokenization in Im2Seq models. In this paper, we aim for the opposite and investigate the impact of the table structure representation language with an otherwise unmodified Im2Seq transformer-based architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9], we select this model to perform our experiments." }, { "label": "text", "id": 1, "page_no": 2, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76498, "t": 214.83587999999997, "r": 480.59572999999995, "b": 331.22986, "coord_origin": "TOPLEFT" }, "confidence": 0.9871861338615417, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 223.63287000000003, "r_x1": 480.5939, "r_y1": 223.63287000000003, "r_x2": 480.5939, "r_y2": 214.83587999999997, "r_x3": 149.70898, "r_y3": 214.83587999999997, "coord_origin": "TOPLEFT" }, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 235.58789000000002, "r_x1": 480.5938100000001, "r_y1": 235.58789000000002, "r_x2": 480.5938100000001, "r_y2": 226.79089, "r_x3": 134.76498, "r_y3": 226.79089, "coord_origin": "TOPLEFT" }, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 247.54387999999994, "r_x1": 480.58667, "r_y1": 247.54387999999994, "r_x2": 480.58667, "r_y2": 238.74689, "r_x3": 134.76498, "r_y3": 238.74689, "coord_origin": "TOPLEFT" }, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 259.49890000000005, "r_x1": 480.5867, "r_y1": 259.49890000000005, "r_x2": 480.5867, "r_y2": 250.70190000000002, "r_x3": 134.76498, "r_y3": 250.70190000000002, "coord_origin": "TOPLEFT" }, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 271.45392000000004, "r_x1": 480.58771, "r_y1": 271.45392000000004, "r_x2": 480.58771, "r_y2": 262.65692, "r_x3": 134.76498, "r_y3": 262.65692, "coord_origin": "TOPLEFT" }, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 283.40891, "r_x1": 480.59572999999995, "r_y1": 283.40891, "r_x2": 480.59572999999995, "r_y2": 274.61194, "r_x3": 134.76498, "r_y3": 274.61194, "coord_origin": "TOPLEFT" }, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 295.36389, "r_x1": 480.59274, "r_y1": 295.36389, "r_x2": 480.59274, "r_y2": 286.56692999999996, "r_x3": 134.76498, "r_y3": 286.56692999999996, "coord_origin": "TOPLEFT" }, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 307.31888, "r_x1": 480.59473, "r_y1": 307.31888, "r_x2": 480.59473, "r_y2": 298.52190999999993, "r_x3": 134.76498, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 319.27487, "r_x1": 480.58667, "r_y1": 319.27487, "r_x2": 480.58667, "r_y2": 310.47791, "r_x3": 134.76498, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 331.22986, "r_x1": 179.72021, "r_y1": 331.22986, "r_x2": 179.72021, "r_y2": 322.43289, "r_x3": 134.76498, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The main contribution of this paper is the introduction of a new optimised table structure language (OTSL), specifically designed to describe table-structure in an compact and structured way for Im2Seq models. OTSL has a number of key features, which make it very attractive to use in Im2Seq models. Specifically, compared to other languages such as HTML, OTSL has a minimized vocabulary which yields short sequence length, strong inherent structure (e.g. strict rectangular layout) and a strict syntax with rules that only look backwards. The latter allows for syntax validation during inference and ensures a syntactically correct table-structure. These OTSL features are illustrated in Figure 1, in comparison to HTML." }, { "label": "text", "id": 0, "page_no": 2, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76498, "t": 334.64789, "r": 480.59567, "b": 439.08676, "coord_origin": "TOPLEFT" }, "confidence": 0.988121747970581, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 343.44485000000003, "r_x1": 480.5878000000001, "r_y1": 343.44485000000003, "r_x2": 480.5878000000001, "r_y2": 334.64789, "r_x3": 149.70898, "r_y3": 334.64789, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 355.40085, "r_x1": 480.59375, "r_y1": 355.40085, "r_x2": 480.59375, "r_y2": 346.60388000000006, "r_x3": 134.76498, "r_y3": 346.60388000000006, "coord_origin": "TOPLEFT" }, "text": "latest developments in table-structure reconstruction. In section 3 we review", "orig": "latest developments in table-structure reconstruction. In section 3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 367.3558300000001, "r_x1": 480.58673, "r_y1": 367.3558300000001, "r_x2": 480.58673, "r_y2": 358.55887, "r_x3": 134.76498, "r_y3": 358.55887, "coord_origin": "TOPLEFT" }, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 379.31082, "r_x1": 480.59161, "r_y1": 379.31082, "r_x2": 480.59161, "r_y2": 370.51385, "r_x3": 134.76498, "r_y3": 370.51385, "coord_origin": "TOPLEFT" }, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 391.26581, "r_x1": 480.59177000000005, "r_y1": 391.26581, "r_x2": 480.59177000000005, "r_y2": 382.46883999999994, "r_x3": 134.76498, "r_y3": 382.46883999999994, "coord_origin": "TOPLEFT" }, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 403.2207900000001, "r_x1": 480.58774, "r_y1": 403.2207900000001, "r_x2": 480.58774, "r_y2": 394.42383, "r_x3": 134.76498, "r_y3": 394.42383, "coord_origin": "TOPLEFT" }, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 415.17679, "r_x1": 480.59469999999993, "r_y1": 415.17679, "r_x2": 480.59469999999993, "r_y2": 406.37982, "r_x3": 134.76498, "r_y3": 406.37982, "coord_origin": "TOPLEFT" }, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 427.13177, "r_x1": 480.59567, "r_y1": 427.13177, "r_x2": 480.59567, "r_y2": 418.33481, "r_x3": 134.76498, "r_y3": 418.33481, "coord_origin": "TOPLEFT" }, "text": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "orig": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 439.08676, "r_x1": 201.27232, "r_y1": 439.08676, "r_x2": 201.27232, "r_y2": 430.28979, "r_x3": 134.76498, "r_y3": 430.28979, "coord_origin": "TOPLEFT" }, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The paper is structured as follows. In section 2, we give an overview of the latest developments in table-structure reconstruction. In section 3 we review the current HTML table encoding (popularised by PubTabNet and FinTabNet) and discuss its flaws. Subsequently, we introduce OTSL in section 4, which includes the language definition, syntax rules and error-correction procedures. In section 5, we apply OTSL on the TableFormer architecture, compare it to TableFormer models trained on HTML and ultimately demonstrate the advantages of using OTSL. Finally, in section 6 we conclude our work and outline next potential steps." }, { "label": "section_header", "id": 4, "page_no": 2, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 134.76498, "t": 462.08795, "r": 236.76912999999996, "b": 472.65634, "coord_origin": "TOPLEFT" }, "confidence": 0.9439423680305481, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 472.65634, "r_x1": 141.48859, "r_y1": 472.65634, "r_x2": 141.48859, "r_y2": 462.08795, "r_x3": 134.76498, "r_y3": 462.08795, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93819, "r_y0": 472.65634, "r_x1": 236.76912999999996, "r_y1": 472.65634, "r_x2": 236.76912999999996, "r_y2": 462.08795, "r_x3": 154.93819, "r_y3": 462.08795, "coord_origin": "TOPLEFT" }, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2 Related Work" }, { "label": "text", "id": 3, "page_no": 2, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.76498, "t": 488.68582, "r": 484.12047999999993, "b": 664.85577, "coord_origin": "TOPLEFT" }, "confidence": 0.9870182871818542, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 497.48279, "r_x1": 480.59067, "r_y1": 497.48279, "r_x2": 480.59067, "r_y2": 488.68582, "r_x3": 134.76498, "r_y3": 488.68582, "coord_origin": "TOPLEFT" }, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 509.43777, "r_x1": 480.5917400000001, "r_y1": 509.43777, "r_x2": 480.5917400000001, "r_y2": 500.64081, "r_x3": 134.76498, "r_y3": 500.64081, "coord_origin": "TOPLEFT" }, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 521.39276, "r_x1": 480.58971999999994, "r_y1": 521.39276, "r_x2": 480.58971999999994, "r_y2": 512.5957900000001, "r_x3": 134.76498, "r_y3": 512.5957900000001, "coord_origin": "TOPLEFT" }, "text": "variety of computer vision methods have been explored to tackle the prob-", "orig": "variety of computer vision methods have been explored to tackle the prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 533.34875, "r_x1": 480.58966, "r_y1": 533.34875, "r_x2": 480.58966, "r_y2": 524.55179, "r_x3": 134.76498, "r_y3": 524.55179, "coord_origin": "TOPLEFT" }, "text": "lem of table structure recognition, i.e. the correct identification of columns,", "orig": "lem of table structure recognition, i.e. the correct identification of columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 545.30376, "r_x1": 480.5897499999999, "r_y1": 545.30376, "r_x2": 480.5897499999999, "r_y2": 536.50679, "r_x3": 134.76498, "r_y3": 536.50679, "coord_origin": "TOPLEFT" }, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 557.2587599999999, "r_x1": 480.58862000000005, "r_y1": 557.2587599999999, "r_x2": 480.58862000000005, "r_y2": 548.4617900000001, "r_x3": 134.76498, "r_y3": 548.4617900000001, "coord_origin": "TOPLEFT" }, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 569.21376, "r_x1": 480.59072999999995, "r_y1": 569.21376, "r_x2": 480.59072999999995, "r_y2": 560.41679, "r_x3": 134.76498, "r_y3": 560.41679, "coord_origin": "TOPLEFT" }, "text": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "orig": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 581.16876, "r_x1": 484.12047999999993, "r_y1": 581.16876, "r_x2": 484.12047999999993, "r_y2": 572.3718, "r_x3": 134.76498, "r_y3": 572.3718, "coord_origin": "TOPLEFT" }, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 593.12376, "r_x1": 480.59567, "r_y1": 593.12376, "r_x2": 480.59567, "r_y2": 584.3267999999999, "r_x3": 134.76498, "r_y3": 584.3267999999999, "coord_origin": "TOPLEFT" }, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 605.07976, "r_x1": 480.58871, "r_y1": 605.07976, "r_x2": 480.58871, "r_y2": 596.28279, "r_x3": 134.76498, "r_y3": 596.28279, "coord_origin": "TOPLEFT" }, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 617.03476, "r_x1": 480.59075999999993, "r_y1": 617.03476, "r_x2": 480.59075999999993, "r_y2": 608.23779, "r_x3": 134.76498, "r_y3": 608.23779, "coord_origin": "TOPLEFT" }, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 628.9897599999999, "r_x1": 480.58574999999996, "r_y1": 628.9897599999999, "r_x2": 480.58574999999996, "r_y2": 620.1927900000001, "r_x3": 134.76498, "r_y3": 620.1927900000001, "coord_origin": "TOPLEFT" }, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 640.94476, "r_x1": 480.58875, "r_y1": 640.94476, "r_x2": 480.58875, "r_y2": 632.1478, "r_x3": 134.76498, "r_y3": 632.1478, "coord_origin": "TOPLEFT" }, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 652.89977, "r_x1": 480.58875, "r_y1": 652.89977, "r_x2": 480.58875, "r_y2": 644.1028, "r_x3": 134.76498, "r_y3": 644.1028, "coord_origin": "TOPLEFT" }, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 664.85577, "r_x1": 480.59069999999997, "r_y1": 664.85577, "r_x2": 480.59069999999997, "r_y2": 656.05879, "r_x3": 134.76498, "r_y3": 656.05879, "coord_origin": "TOPLEFT" }, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Approaches to formalize the logical structure and layout of tables in electronic documents date back more than two decades [16]. In the recent past, a wide variety of computer vision methods have been explored to tackle the problem of table structure recognition, i.e. the correct identification of columns, rows and spanning cells in a given table. Broadly speaking, the current deeplearning based approaches fall into three categories: object detection (OD) methods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence (Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on tablestructure annotation using (overlapping) bounding boxes for training, and produce bounding-box predictions to define table cells, rows, and columns on a table image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name suggests, represent tables as graph structures. The graph nodes represent the content of each table cell, an embedding vector from the table image, or geometric coordinates of the table cell. The edges of the graph define the relationship between the nodes, e.g. if they belong to the same column, row, or table cell." } ], "body": [ { "label": "text", "id": 2, "page_no": 2, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76498, "t": 118.93377999999996, "r": 480.59183, "b": 211.41687000000002, "coord_origin": "TOPLEFT" }, "confidence": 0.9871802926063538, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 127.73077, "r_x1": 480.59183, "r_y1": 127.73077, "r_x2": 480.59183, "r_y2": 118.93377999999996, "r_x3": 149.709, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 480.58675999999997, "r_y1": 139.68579, "r_x2": 480.58675999999997, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 151.64178000000004, "r_x1": 480.5917400000001, "r_y1": 151.64178000000004, "r_x2": 480.5917400000001, "r_y2": 142.84479, "r_x3": 134.765, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 163.59680000000003, "r_x1": 169.62514, "r_y1": 163.59680000000003, "r_x2": 169.62514, "r_y2": 154.7998, "r_x3": 134.765, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.86099, "r_y0": 163.59680000000003, "r_x1": 194.55531, "r_y1": 163.59680000000003, "r_x2": 194.55531, "r_y2": 154.7998, "r_x3": 173.86099, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.60999, "r_y0": 163.59680000000003, "r_x1": 480.58618, "r_y1": 163.59680000000003, "r_x2": 480.58618, "r_y2": 154.7998, "r_x3": 199.60999, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "for the sequence tokenization in Im2Seq models. In this paper,", "orig": "for the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 175.55182000000002, "r_x1": 480.59167, "r_y1": 175.55182000000002, "r_x2": 480.59167, "r_y2": 166.75482, "r_x3": 134.76498, "r_y3": 166.75482, "coord_origin": "TOPLEFT" }, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 187.50684, "r_x1": 480.58968999999996, "r_y1": 187.50684, "r_x2": 480.58968999999996, "r_y2": 178.70983999999999, "r_x3": 134.76498, "r_y3": 178.70983999999999, "coord_origin": "TOPLEFT" }, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 199.46185000000003, "r_x1": 480.5917400000001, "r_y1": 199.46185000000003, "r_x2": 480.5917400000001, "r_y2": 190.66485999999998, "r_x3": 134.76498, "r_y3": 190.66485999999998, "coord_origin": "TOPLEFT" }, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 211.41687000000002, "r_x1": 348.35519, "r_y1": 211.41687000000002, "r_x2": 348.35519, "r_y2": 202.61987, "r_x3": 134.76498, "r_y3": 202.61987, "coord_origin": "TOPLEFT" }, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "While the majority of research in TSR is currently focused on the development and application of novel neural model architectures, the table structure representation language (e.g. HTML in PubTabNet and FinTabNet) is usually adopted as is for the sequence tokenization in Im2Seq models. In this paper, we aim for the opposite and investigate the impact of the table structure representation language with an otherwise unmodified Im2Seq transformer-based architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9], we select this model to perform our experiments." }, { "label": "text", "id": 1, "page_no": 2, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76498, "t": 214.83587999999997, "r": 480.59572999999995, "b": 331.22986, "coord_origin": "TOPLEFT" }, "confidence": 0.9871861338615417, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 223.63287000000003, "r_x1": 480.5939, "r_y1": 223.63287000000003, "r_x2": 480.5939, "r_y2": 214.83587999999997, "r_x3": 149.70898, "r_y3": 214.83587999999997, "coord_origin": "TOPLEFT" }, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 235.58789000000002, "r_x1": 480.5938100000001, "r_y1": 235.58789000000002, "r_x2": 480.5938100000001, "r_y2": 226.79089, "r_x3": 134.76498, "r_y3": 226.79089, "coord_origin": "TOPLEFT" }, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 247.54387999999994, "r_x1": 480.58667, "r_y1": 247.54387999999994, "r_x2": 480.58667, "r_y2": 238.74689, "r_x3": 134.76498, "r_y3": 238.74689, "coord_origin": "TOPLEFT" }, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 259.49890000000005, "r_x1": 480.5867, "r_y1": 259.49890000000005, "r_x2": 480.5867, "r_y2": 250.70190000000002, "r_x3": 134.76498, "r_y3": 250.70190000000002, "coord_origin": "TOPLEFT" }, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 271.45392000000004, "r_x1": 480.58771, "r_y1": 271.45392000000004, "r_x2": 480.58771, "r_y2": 262.65692, "r_x3": 134.76498, "r_y3": 262.65692, "coord_origin": "TOPLEFT" }, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 283.40891, "r_x1": 480.59572999999995, "r_y1": 283.40891, "r_x2": 480.59572999999995, "r_y2": 274.61194, "r_x3": 134.76498, "r_y3": 274.61194, "coord_origin": "TOPLEFT" }, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 295.36389, "r_x1": 480.59274, "r_y1": 295.36389, "r_x2": 480.59274, "r_y2": 286.56692999999996, "r_x3": 134.76498, "r_y3": 286.56692999999996, "coord_origin": "TOPLEFT" }, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 307.31888, "r_x1": 480.59473, "r_y1": 307.31888, "r_x2": 480.59473, "r_y2": 298.52190999999993, "r_x3": 134.76498, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 319.27487, "r_x1": 480.58667, "r_y1": 319.27487, "r_x2": 480.58667, "r_y2": 310.47791, "r_x3": 134.76498, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 331.22986, "r_x1": 179.72021, "r_y1": 331.22986, "r_x2": 179.72021, "r_y2": 322.43289, "r_x3": 134.76498, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The main contribution of this paper is the introduction of a new optimised table structure language (OTSL), specifically designed to describe table-structure in an compact and structured way for Im2Seq models. OTSL has a number of key features, which make it very attractive to use in Im2Seq models. Specifically, compared to other languages such as HTML, OTSL has a minimized vocabulary which yields short sequence length, strong inherent structure (e.g. strict rectangular layout) and a strict syntax with rules that only look backwards. The latter allows for syntax validation during inference and ensures a syntactically correct table-structure. These OTSL features are illustrated in Figure 1, in comparison to HTML." }, { "label": "text", "id": 0, "page_no": 2, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76498, "t": 334.64789, "r": 480.59567, "b": 439.08676, "coord_origin": "TOPLEFT" }, "confidence": 0.988121747970581, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 343.44485000000003, "r_x1": 480.5878000000001, "r_y1": 343.44485000000003, "r_x2": 480.5878000000001, "r_y2": 334.64789, "r_x3": 149.70898, "r_y3": 334.64789, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 355.40085, "r_x1": 480.59375, "r_y1": 355.40085, "r_x2": 480.59375, "r_y2": 346.60388000000006, "r_x3": 134.76498, "r_y3": 346.60388000000006, "coord_origin": "TOPLEFT" }, "text": "latest developments in table-structure reconstruction. In section 3 we review", "orig": "latest developments in table-structure reconstruction. In section 3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 367.3558300000001, "r_x1": 480.58673, "r_y1": 367.3558300000001, "r_x2": 480.58673, "r_y2": 358.55887, "r_x3": 134.76498, "r_y3": 358.55887, "coord_origin": "TOPLEFT" }, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 379.31082, "r_x1": 480.59161, "r_y1": 379.31082, "r_x2": 480.59161, "r_y2": 370.51385, "r_x3": 134.76498, "r_y3": 370.51385, "coord_origin": "TOPLEFT" }, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 391.26581, "r_x1": 480.59177000000005, "r_y1": 391.26581, "r_x2": 480.59177000000005, "r_y2": 382.46883999999994, "r_x3": 134.76498, "r_y3": 382.46883999999994, "coord_origin": "TOPLEFT" }, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 403.2207900000001, "r_x1": 480.58774, "r_y1": 403.2207900000001, "r_x2": 480.58774, "r_y2": 394.42383, "r_x3": 134.76498, "r_y3": 394.42383, "coord_origin": "TOPLEFT" }, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 415.17679, "r_x1": 480.59469999999993, "r_y1": 415.17679, "r_x2": 480.59469999999993, "r_y2": 406.37982, "r_x3": 134.76498, "r_y3": 406.37982, "coord_origin": "TOPLEFT" }, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 427.13177, "r_x1": 480.59567, "r_y1": 427.13177, "r_x2": 480.59567, "r_y2": 418.33481, "r_x3": 134.76498, "r_y3": 418.33481, "coord_origin": "TOPLEFT" }, "text": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "orig": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 439.08676, "r_x1": 201.27232, "r_y1": 439.08676, "r_x2": 201.27232, "r_y2": 430.28979, "r_x3": 134.76498, "r_y3": 430.28979, "coord_origin": "TOPLEFT" }, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The paper is structured as follows. In section 2, we give an overview of the latest developments in table-structure reconstruction. In section 3 we review the current HTML table encoding (popularised by PubTabNet and FinTabNet) and discuss its flaws. Subsequently, we introduce OTSL in section 4, which includes the language definition, syntax rules and error-correction procedures. In section 5, we apply OTSL on the TableFormer architecture, compare it to TableFormer models trained on HTML and ultimately demonstrate the advantages of using OTSL. Finally, in section 6 we conclude our work and outline next potential steps." }, { "label": "section_header", "id": 4, "page_no": 2, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 134.76498, "t": 462.08795, "r": 236.76912999999996, "b": 472.65634, "coord_origin": "TOPLEFT" }, "confidence": 0.9439423680305481, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 472.65634, "r_x1": 141.48859, "r_y1": 472.65634, "r_x2": 141.48859, "r_y2": 462.08795, "r_x3": 134.76498, "r_y3": 462.08795, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93819, "r_y0": 472.65634, "r_x1": 236.76912999999996, "r_y1": 472.65634, "r_x2": 236.76912999999996, "r_y2": 462.08795, "r_x3": 154.93819, "r_y3": 462.08795, "coord_origin": "TOPLEFT" }, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2 Related Work" }, { "label": "text", "id": 3, "page_no": 2, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.76498, "t": 488.68582, "r": 484.12047999999993, "b": 664.85577, "coord_origin": "TOPLEFT" }, "confidence": 0.9870182871818542, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 497.48279, "r_x1": 480.59067, "r_y1": 497.48279, "r_x2": 480.59067, "r_y2": 488.68582, "r_x3": 134.76498, "r_y3": 488.68582, "coord_origin": "TOPLEFT" }, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 509.43777, "r_x1": 480.5917400000001, "r_y1": 509.43777, "r_x2": 480.5917400000001, "r_y2": 500.64081, "r_x3": 134.76498, "r_y3": 500.64081, "coord_origin": "TOPLEFT" }, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 521.39276, "r_x1": 480.58971999999994, "r_y1": 521.39276, "r_x2": 480.58971999999994, "r_y2": 512.5957900000001, "r_x3": 134.76498, "r_y3": 512.5957900000001, "coord_origin": "TOPLEFT" }, "text": "variety of computer vision methods have been explored to tackle the prob-", "orig": "variety of computer vision methods have been explored to tackle the prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 533.34875, "r_x1": 480.58966, "r_y1": 533.34875, "r_x2": 480.58966, "r_y2": 524.55179, "r_x3": 134.76498, "r_y3": 524.55179, "coord_origin": "TOPLEFT" }, "text": "lem of table structure recognition, i.e. the correct identification of columns,", "orig": "lem of table structure recognition, i.e. the correct identification of columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 545.30376, "r_x1": 480.5897499999999, "r_y1": 545.30376, "r_x2": 480.5897499999999, "r_y2": 536.50679, "r_x3": 134.76498, "r_y3": 536.50679, "coord_origin": "TOPLEFT" }, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 557.2587599999999, "r_x1": 480.58862000000005, "r_y1": 557.2587599999999, "r_x2": 480.58862000000005, "r_y2": 548.4617900000001, "r_x3": 134.76498, "r_y3": 548.4617900000001, "coord_origin": "TOPLEFT" }, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 569.21376, "r_x1": 480.59072999999995, "r_y1": 569.21376, "r_x2": 480.59072999999995, "r_y2": 560.41679, "r_x3": 134.76498, "r_y3": 560.41679, "coord_origin": "TOPLEFT" }, "text": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "orig": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 581.16876, "r_x1": 484.12047999999993, "r_y1": 581.16876, "r_x2": 484.12047999999993, "r_y2": 572.3718, "r_x3": 134.76498, "r_y3": 572.3718, "coord_origin": "TOPLEFT" }, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 593.12376, "r_x1": 480.59567, "r_y1": 593.12376, "r_x2": 480.59567, "r_y2": 584.3267999999999, "r_x3": 134.76498, "r_y3": 584.3267999999999, "coord_origin": "TOPLEFT" }, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 605.07976, "r_x1": 480.58871, "r_y1": 605.07976, "r_x2": 480.58871, "r_y2": 596.28279, "r_x3": 134.76498, "r_y3": 596.28279, "coord_origin": "TOPLEFT" }, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 617.03476, "r_x1": 480.59075999999993, "r_y1": 617.03476, "r_x2": 480.59075999999993, "r_y2": 608.23779, "r_x3": 134.76498, "r_y3": 608.23779, "coord_origin": "TOPLEFT" }, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 628.9897599999999, "r_x1": 480.58574999999996, "r_y1": 628.9897599999999, "r_x2": 480.58574999999996, "r_y2": 620.1927900000001, "r_x3": 134.76498, "r_y3": 620.1927900000001, "coord_origin": "TOPLEFT" }, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 640.94476, "r_x1": 480.58875, "r_y1": 640.94476, "r_x2": 480.58875, "r_y2": 632.1478, "r_x3": 134.76498, "r_y3": 632.1478, "coord_origin": "TOPLEFT" }, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 652.89977, "r_x1": 480.58875, "r_y1": 652.89977, "r_x2": 480.58875, "r_y2": 644.1028, "r_x3": 134.76498, "r_y3": 644.1028, "coord_origin": "TOPLEFT" }, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 664.85577, "r_x1": 480.59069999999997, "r_y1": 664.85577, "r_x2": 480.59069999999997, "r_y2": 656.05879, "r_x3": 134.76498, "r_y3": 656.05879, "coord_origin": "TOPLEFT" }, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Approaches to formalize the logical structure and layout of tables in electronic documents date back more than two decades [16]. In the recent past, a wide variety of computer vision methods have been explored to tackle the problem of table structure recognition, i.e. the correct identification of columns, rows and spanning cells in a given table. Broadly speaking, the current deeplearning based approaches fall into three categories: object detection (OD) methods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence (Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on tablestructure annotation using (overlapping) bounding boxes for training, and produce bounding-box predictions to define table cells, rows, and columns on a table image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name suggests, represent tables as graph structures. The graph nodes represent the content of each table cell, an embedding vector from the table image, or geometric coordinates of the table cell. The edges of the graph define the relationship between the nodes, e.g. if they belong to the same column, row, or table cell." } ], "headers": [ { "label": "page_header", "id": 5, "page_no": 2, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9325801730155945, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 6, "page_no": 2, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 475.98431, "t": 93.77099999999996, "r": 480.59125000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8773486614227295, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3" } ] } }, { "page_no": 3, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.59375, "r_y1": 127.73077, "r_x2": 480.59375, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 480.58774, "r_y1": 139.68579, "r_x2": 480.58774, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 151.64178000000004, "r_x1": 480.58675999999997, "r_y1": 151.64178000000004, "r_x2": 480.58675999999997, "r_y2": 142.84479, "r_x3": 134.765, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 163.59680000000003, "r_x1": 480.5878000000001, "r_y1": 163.59680000000003, "r_x2": 480.5878000000001, "r_y2": 154.7998, "r_x3": 134.765, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "structure representation language, which is often implemented with standard", "orig": "structure representation language, which is often implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 175.55182000000002, "r_x1": 480.59271, "r_y1": 175.55182000000002, "r_x2": 480.59271, "r_y2": 166.75482, "r_x3": 134.765, "r_y3": 166.75482, "coord_origin": "TOPLEFT" }, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 187.50684, "r_x1": 480.5957599999999, "r_y1": 187.50684, "r_x2": 480.5957599999999, "r_y2": 178.70983999999999, "r_x3": 134.765, "r_y3": 178.70983999999999, "coord_origin": "TOPLEFT" }, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 199.46185000000003, "r_x1": 480.59271, "r_y1": 199.46185000000003, "r_x2": 480.59271, "r_y2": 190.66485999999998, "r_x3": 134.765, "r_y3": 190.66485999999998, "coord_origin": "TOPLEFT" }, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 211.41687000000002, "r_x1": 480.59378, "r_y1": 211.41687000000002, "r_x2": 480.59378, "r_y2": 202.61987, "r_x3": 134.765, "r_y3": 202.61987, "coord_origin": "TOPLEFT" }, "text": "in order to obtain the table-structure, which is necessary with OD and GNN", "orig": "in order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 223.37285999999995, "r_x1": 480.58783000000005, "r_y1": 223.37285999999995, "r_x2": 480.58783000000005, "r_y2": 214.57587, "r_x3": 134.765, "r_y3": 214.57587, "coord_origin": "TOPLEFT" }, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 235.32788000000005, "r_x1": 480.58978, "r_y1": 235.32788000000005, "r_x2": 480.58978, "r_y2": 226.53088000000002, "r_x3": 134.765, "r_y3": 226.53088000000002, "coord_origin": "TOPLEFT" }, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 247.28290000000004, "r_x1": 480.59572999999995, "r_y1": 247.28290000000004, "r_x2": 480.59572999999995, "r_y2": 238.48590000000002, "r_x3": 134.765, "r_y3": 238.48590000000002, "coord_origin": "TOPLEFT" }, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 259.23792000000003, "r_x1": 480.59473, "r_y1": 259.23792000000003, "r_x2": 480.59473, "r_y2": 250.44092, "r_x3": 134.765, "r_y3": 250.44092, "coord_origin": "TOPLEFT" }, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 271.45392000000004, "r_x1": 480.59280000000007, "r_y1": 271.45392000000004, "r_x2": 480.59280000000007, "r_y2": 262.65692, "r_x3": 149.709, "r_y3": 262.65692, "coord_origin": "TOPLEFT" }, "text": "Within the Im2Seq method, we find several popular models, namely the", "orig": "Within the Im2Seq method, we find several popular models, namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 283.40891, "r_x1": 480.59167, "r_y1": 283.40891, "r_x2": 480.59167, "r_y2": 274.61194, "r_x3": 134.765, "r_y3": 274.61194, "coord_origin": "TOPLEFT" }, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 295.36389, "r_x1": 480.59271, "r_y1": 295.36389, "r_x2": 480.59271, "r_y2": 286.56692999999996, "r_x3": 134.765, "r_y3": 286.56692999999996, "coord_origin": "TOPLEFT" }, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 307.31888, "r_x1": 342.02097, "r_y1": 307.31888, "r_x2": 342.02097, "r_y2": 298.52190999999993, "r_x3": 134.765, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.064, "r_y0": 307.31888, "r_x1": 393.04684, "r_y1": 307.31888, "r_x2": 393.04684, "r_y2": 298.52190999999993, "r_x3": 345.064, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.16699, "r_y0": 307.31888, "r_x1": 480.59082, "r_y1": 307.31888, "r_x2": 480.59082, "r_y2": 298.52190999999993, "r_x3": 397.16699, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 319.27487, "r_x1": 333.29871, "r_y1": 319.27487, "r_x2": 333.29871, "r_y2": 310.47791, "r_x3": 134.76498, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.29898, "r_y0": 319.27487, "r_x1": 356.9711, "r_y1": 319.27487, "r_x2": 356.9711, "r_y2": 310.47791, "r_x3": 333.29898, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.08499, "r_y0": 319.27487, "r_x1": 480.59433000000007, "r_y1": 319.27487, "r_x2": 480.59433000000007, "r_y2": 310.47791, "r_x3": 357.08499, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "), the attention is passed to", "orig": "), the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 331.22986, "r_x1": 148.59805, "r_y1": 331.22986, "r_x2": 148.59805, "r_y2": 322.43289, "r_x3": 134.76498, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.27698, "r_y0": 331.22986, "r_x1": 202.1109, "r_y1": 331.22986, "r_x2": 202.1109, "r_y2": 322.43289, "r_x3": 152.27698, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "cell decoder", "orig": "cell decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.86398, "r_y0": 331.22986, "r_x1": 480.58743, "r_y1": 331.22986, "r_x2": 480.58743, "r_y2": 322.43289, "r_x3": 206.86398, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 343.18484, "r_x1": 480.59476, "r_y1": 343.18484, "r_x2": 480.59476, "r_y2": 334.38788, "r_x3": 134.76498, "r_y3": 334.38788, "coord_origin": "TOPLEFT" }, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 355.13983, "r_x1": 480.58675999999997, "r_y1": 355.13983, "r_x2": 480.58675999999997, "r_y2": 346.34286, "r_x3": 134.76498, "r_y3": 346.34286, "coord_origin": "TOPLEFT" }, "text": "TableFormer address this reliance on OCR and uses two transformer decoders for", "orig": "TableFormer address this reliance on OCR and uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 367.09482, "r_x1": 480.58868, "r_y1": 367.09482, "r_x2": 480.58868, "r_y2": 358.29785, "r_x3": 134.76498, "r_y3": 358.29785, "coord_origin": "TOPLEFT" }, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 379.0498, "r_x1": 480.58868, "r_y1": 379.0498, "r_x2": 480.58868, "r_y2": 370.25284, "r_x3": 134.76498, "r_y3": 370.25284, "coord_origin": "TOPLEFT" }, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 391.0058, "r_x1": 480.59357000000006, "r_y1": 391.0058, "r_x2": 480.59357000000006, "r_y2": 382.20883, "r_x3": 134.76498, "r_y3": 382.20883, "coord_origin": "TOPLEFT" }, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 402.96078, "r_x1": 144.76979, "r_y1": 402.96078, "r_x2": 144.76979, "r_y2": 394.16382, "r_x3": 134.76498, "r_y3": 394.16382, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.50908, "r_y0": 402.96078, "r_x1": 480.58667, "r_y1": 402.96078, "r_x2": 480.58667, "r_y2": 394.16382, "r_x3": 149.50908, "r_y3": 394.16382, "coord_origin": "TOPLEFT" }, "text": "proposes a compact double-matrix representation of table rows and columns", "orig": "proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 414.91576999999995, "r_x1": 480.59569999999997, "r_y1": 414.91576999999995, "r_x2": 480.59569999999997, "r_y2": 406.1188, "r_x3": 134.76498, "r_y3": 406.1188, "coord_origin": "TOPLEFT" }, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 426.87076, "r_x1": 480.59180000000003, "r_y1": 426.87076, "r_x2": 480.59180000000003, "r_y2": 418.07379, "r_x3": 134.76498, "r_y3": 418.07379, "coord_origin": "TOPLEFT" }, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 438.82574, "r_x1": 480.5878000000001, "r_y1": 438.82574, "r_x2": 480.5878000000001, "r_y2": 430.02878, "r_x3": 134.76498, "r_y3": 430.02878, "coord_origin": "TOPLEFT" }, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 450.78073, "r_x1": 480.58868, "r_y1": 450.78073, "r_x2": 480.58868, "r_y2": 441.98376, "r_x3": 134.76498, "r_y3": 441.98376, "coord_origin": "TOPLEFT" }, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 462.73672, "r_x1": 384.5752, "r_y1": 462.73672, "r_x2": 384.5752, "r_y2": 453.93976000000004, "r_x3": 134.76498, "r_y3": 453.93976000000004, "coord_origin": "TOPLEFT" }, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.55899, "r_y0": 462.73672, "r_x1": 401.73236, "r_y1": 462.73672, "r_x2": 401.73236, "r_y2": 453.93976000000004, "r_x3": 391.55899, "r_y3": 453.93976000000004, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.55154, "r_y0": 462.73672, "r_x1": 480.58777, "r_y1": 462.73672, "r_x2": 480.58777, "r_y2": 453.93976000000004, "r_x3": 406.55154, "r_y3": 453.93976000000004, "coord_origin": "TOPLEFT" }, "text": "introduces Gated", "orig": "introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 474.69171, "r_x1": 480.59079, "r_y1": 474.69171, "r_x2": 480.59079, "r_y2": 465.89474, "r_x3": 134.76498, "r_y3": 465.89474, "coord_origin": "TOPLEFT" }, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 486.6467, "r_x1": 203.68625, "r_y1": 486.6467, "r_x2": 203.68625, "r_y2": 477.84973, "r_x3": 134.76498, "r_y3": 477.84973, "coord_origin": "TOPLEFT" }, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 498.8627, "r_x1": 480.59378, "r_y1": 498.8627, "r_x2": 480.59378, "r_y2": 490.06573, "r_x3": 149.70898, "r_y3": 490.06573, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 510.81769, "r_x1": 480.58871, "r_y1": 510.81769, "r_x2": 480.58871, "r_y2": 502.02072, "r_x3": 134.76498, "r_y3": 502.02072, "coord_origin": "TOPLEFT" }, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 522.7726700000001, "r_x1": 480.58675999999997, "r_y1": 522.7726700000001, "r_x2": 480.58675999999997, "r_y2": 513.9757099999999, "r_x3": 134.76498, "r_y3": 513.9757099999999, "coord_origin": "TOPLEFT" }, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 534.72766, "r_x1": 480.58978, "r_y1": 534.72766, "r_x2": 480.58978, "r_y2": 525.93069, "r_x3": 134.76498, "r_y3": 525.93069, "coord_origin": "TOPLEFT" }, "text": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "orig": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 546.6826599999999, "r_x1": 480.58765, "r_y1": 546.6826599999999, "r_x2": 480.58765, "r_y2": 537.8857, "r_x3": 134.76498, "r_y3": 537.8857, "coord_origin": "TOPLEFT" }, "text": "to investigate if the performance (both in accuracy and inference time) can", "orig": "to investigate if the performance (both in accuracy and inference time) can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 558.63866, "r_x1": 480.58971999999994, "r_y1": 558.63866, "r_x2": 480.58971999999994, "r_y2": 549.84169, "r_x3": 134.76498, "r_y3": 549.84169, "coord_origin": "TOPLEFT" }, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 570.59366, "r_x1": 480.58871, "r_y1": 570.59366, "r_x2": 480.58871, "r_y2": 561.79669, "r_x3": 134.76498, "r_y3": 561.79669, "coord_origin": "TOPLEFT" }, "text": "We believe this is a necessary step before further improving neural network", "orig": "We believe this is a necessary step before further improving neural network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 582.54866, "r_x1": 249.27811, "r_y1": 582.54866, "r_x2": 249.27811, "r_y2": 573.75169, "r_x3": 134.76498, "r_y3": 573.75169, "coord_origin": "TOPLEFT" }, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 616.11823, "r_x1": 141.48859, "r_y1": 616.11823, "r_x2": 141.48859, "r_y2": 605.54984, "r_x3": 134.76498, "r_y3": 605.54984, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93819, "r_y0": 616.11823, "r_x1": 269.62442, "r_y1": 616.11823, "r_x2": 269.62442, "r_y2": 605.54984, "r_x3": 154.93819, "r_y3": 605.54984, "coord_origin": "TOPLEFT" }, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 640.94466, "r_x1": 480.59064, "r_y1": 640.94466, "r_x2": 480.59064, "r_y2": 632.14769, "r_x3": 134.76498, "r_y3": 632.14769, "coord_origin": "TOPLEFT" }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 652.89966, "r_x1": 480.5867, "r_y1": 652.89966, "r_x2": 480.5867, "r_y2": 644.1026899999999, "r_x3": 134.76498, "r_y3": 644.1026899999999, "coord_origin": "TOPLEFT" }, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 664.85566, "r_x1": 480.5936899999999, "r_y1": 664.85566, "r_x2": 480.5936899999999, "r_y2": 656.0586900000001, "r_x3": 134.76498, "r_y3": 656.0586900000001, "coord_origin": "TOPLEFT" }, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 6, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 139.37193, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.7890051603317261, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "page_header", "bbox": { "l": 167.81335, "t": 93.77099999999996, "r": 231.72227, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9045588374137878, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.5957599999999, "b": 259.23792000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.9467443823814392, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.59375, "r_y1": 127.73077, "r_x2": 480.59375, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 480.58774, "r_y1": 139.68579, "r_x2": 480.58774, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 151.64178000000004, "r_x1": 480.58675999999997, "r_y1": 151.64178000000004, "r_x2": 480.58675999999997, "r_y2": 142.84479, "r_x3": 134.765, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 163.59680000000003, "r_x1": 480.5878000000001, "r_y1": 163.59680000000003, "r_x2": 480.5878000000001, "r_y2": 154.7998, "r_x3": 134.765, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "structure representation language, which is often implemented with standard", "orig": "structure representation language, which is often implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 175.55182000000002, "r_x1": 480.59271, "r_y1": 175.55182000000002, "r_x2": 480.59271, "r_y2": 166.75482, "r_x3": 134.765, "r_y3": 166.75482, "coord_origin": "TOPLEFT" }, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 187.50684, "r_x1": 480.5957599999999, "r_y1": 187.50684, "r_x2": 480.5957599999999, "r_y2": 178.70983999999999, "r_x3": 134.765, "r_y3": 178.70983999999999, "coord_origin": "TOPLEFT" }, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 199.46185000000003, "r_x1": 480.59271, "r_y1": 199.46185000000003, "r_x2": 480.59271, "r_y2": 190.66485999999998, "r_x3": 134.765, "r_y3": 190.66485999999998, "coord_origin": "TOPLEFT" }, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 211.41687000000002, "r_x1": 480.59378, "r_y1": 211.41687000000002, "r_x2": 480.59378, "r_y2": 202.61987, "r_x3": 134.765, "r_y3": 202.61987, "coord_origin": "TOPLEFT" }, "text": "in order to obtain the table-structure, which is necessary with OD and GNN", "orig": "in order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 223.37285999999995, "r_x1": 480.58783000000005, "r_y1": 223.37285999999995, "r_x2": 480.58783000000005, "r_y2": 214.57587, "r_x3": 134.765, "r_y3": 214.57587, "coord_origin": "TOPLEFT" }, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 235.32788000000005, "r_x1": 480.58978, "r_y1": 235.32788000000005, "r_x2": 480.58978, "r_y2": 226.53088000000002, "r_x3": 134.765, "r_y3": 226.53088000000002, "coord_origin": "TOPLEFT" }, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 247.28290000000004, "r_x1": 480.59572999999995, "r_y1": 247.28290000000004, "r_x2": 480.59572999999995, "r_y2": 238.48590000000002, "r_x3": 134.765, "r_y3": 238.48590000000002, "coord_origin": "TOPLEFT" }, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 259.23792000000003, "r_x1": 480.59473, "r_y1": 259.23792000000003, "r_x2": 480.59473, "r_y2": 250.44092, "r_x3": 134.765, "r_y3": 250.44092, "coord_origin": "TOPLEFT" }, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 134.76498, "t": 262.65692, "r": 480.59569999999997, "b": 486.6467, "coord_origin": "TOPLEFT" }, "confidence": 0.929087221622467, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 271.45392000000004, "r_x1": 480.59280000000007, "r_y1": 271.45392000000004, "r_x2": 480.59280000000007, "r_y2": 262.65692, "r_x3": 149.709, "r_y3": 262.65692, "coord_origin": "TOPLEFT" }, "text": "Within the Im2Seq method, we find several popular models, namely the", "orig": "Within the Im2Seq method, we find several popular models, namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 283.40891, "r_x1": 480.59167, "r_y1": 283.40891, "r_x2": 480.59167, "r_y2": 274.61194, "r_x3": 134.765, "r_y3": 274.61194, "coord_origin": "TOPLEFT" }, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 295.36389, "r_x1": 480.59271, "r_y1": 295.36389, "r_x2": 480.59271, "r_y2": 286.56692999999996, "r_x3": 134.765, "r_y3": 286.56692999999996, "coord_origin": "TOPLEFT" }, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 307.31888, "r_x1": 342.02097, "r_y1": 307.31888, "r_x2": 342.02097, "r_y2": 298.52190999999993, "r_x3": 134.765, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.064, "r_y0": 307.31888, "r_x1": 393.04684, "r_y1": 307.31888, "r_x2": 393.04684, "r_y2": 298.52190999999993, "r_x3": 345.064, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.16699, "r_y0": 307.31888, "r_x1": 480.59082, "r_y1": 307.31888, "r_x2": 480.59082, "r_y2": 298.52190999999993, "r_x3": 397.16699, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 319.27487, "r_x1": 333.29871, "r_y1": 319.27487, "r_x2": 333.29871, "r_y2": 310.47791, "r_x3": 134.76498, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.29898, "r_y0": 319.27487, "r_x1": 356.9711, "r_y1": 319.27487, "r_x2": 356.9711, "r_y2": 310.47791, "r_x3": 333.29898, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.08499, "r_y0": 319.27487, "r_x1": 480.59433000000007, "r_y1": 319.27487, "r_x2": 480.59433000000007, "r_y2": 310.47791, "r_x3": 357.08499, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "), the attention is passed to", "orig": "), the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 331.22986, "r_x1": 148.59805, "r_y1": 331.22986, "r_x2": 148.59805, "r_y2": 322.43289, "r_x3": 134.76498, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.27698, "r_y0": 331.22986, "r_x1": 202.1109, "r_y1": 331.22986, "r_x2": 202.1109, "r_y2": 322.43289, "r_x3": 152.27698, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "cell decoder", "orig": "cell decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.86398, "r_y0": 331.22986, "r_x1": 480.58743, "r_y1": 331.22986, "r_x2": 480.58743, "r_y2": 322.43289, "r_x3": 206.86398, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 343.18484, "r_x1": 480.59476, "r_y1": 343.18484, "r_x2": 480.59476, "r_y2": 334.38788, "r_x3": 134.76498, "r_y3": 334.38788, "coord_origin": "TOPLEFT" }, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 355.13983, "r_x1": 480.58675999999997, "r_y1": 355.13983, "r_x2": 480.58675999999997, "r_y2": 346.34286, "r_x3": 134.76498, "r_y3": 346.34286, "coord_origin": "TOPLEFT" }, "text": "TableFormer address this reliance on OCR and uses two transformer decoders for", "orig": "TableFormer address this reliance on OCR and uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 367.09482, "r_x1": 480.58868, "r_y1": 367.09482, "r_x2": 480.58868, "r_y2": 358.29785, "r_x3": 134.76498, "r_y3": 358.29785, "coord_origin": "TOPLEFT" }, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 379.0498, "r_x1": 480.58868, "r_y1": 379.0498, "r_x2": 480.58868, "r_y2": 370.25284, "r_x3": 134.76498, "r_y3": 370.25284, "coord_origin": "TOPLEFT" }, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 391.0058, "r_x1": 480.59357000000006, "r_y1": 391.0058, "r_x2": 480.59357000000006, "r_y2": 382.20883, "r_x3": 134.76498, "r_y3": 382.20883, "coord_origin": "TOPLEFT" }, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 402.96078, "r_x1": 144.76979, "r_y1": 402.96078, "r_x2": 144.76979, "r_y2": 394.16382, "r_x3": 134.76498, "r_y3": 394.16382, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.50908, "r_y0": 402.96078, "r_x1": 480.58667, "r_y1": 402.96078, "r_x2": 480.58667, "r_y2": 394.16382, "r_x3": 149.50908, "r_y3": 394.16382, "coord_origin": "TOPLEFT" }, "text": "proposes a compact double-matrix representation of table rows and columns", "orig": "proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 414.91576999999995, "r_x1": 480.59569999999997, "r_y1": 414.91576999999995, "r_x2": 480.59569999999997, "r_y2": 406.1188, "r_x3": 134.76498, "r_y3": 406.1188, "coord_origin": "TOPLEFT" }, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 426.87076, "r_x1": 480.59180000000003, "r_y1": 426.87076, "r_x2": 480.59180000000003, "r_y2": 418.07379, "r_x3": 134.76498, "r_y3": 418.07379, "coord_origin": "TOPLEFT" }, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 438.82574, "r_x1": 480.5878000000001, "r_y1": 438.82574, "r_x2": 480.5878000000001, "r_y2": 430.02878, "r_x3": 134.76498, "r_y3": 430.02878, "coord_origin": "TOPLEFT" }, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 450.78073, "r_x1": 480.58868, "r_y1": 450.78073, "r_x2": 480.58868, "r_y2": 441.98376, "r_x3": 134.76498, "r_y3": 441.98376, "coord_origin": "TOPLEFT" }, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 462.73672, "r_x1": 384.5752, "r_y1": 462.73672, "r_x2": 384.5752, "r_y2": 453.93976000000004, "r_x3": 134.76498, "r_y3": 453.93976000000004, "coord_origin": "TOPLEFT" }, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.55899, "r_y0": 462.73672, "r_x1": 401.73236, "r_y1": 462.73672, "r_x2": 401.73236, "r_y2": 453.93976000000004, "r_x3": 391.55899, "r_y3": 453.93976000000004, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.55154, "r_y0": 462.73672, "r_x1": 480.58777, "r_y1": 462.73672, "r_x2": 480.58777, "r_y2": 453.93976000000004, "r_x3": 406.55154, "r_y3": 453.93976000000004, "coord_origin": "TOPLEFT" }, "text": "introduces Gated", "orig": "introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 474.69171, "r_x1": 480.59079, "r_y1": 474.69171, "r_x2": 480.59079, "r_y2": 465.89474, "r_x3": 134.76498, "r_y3": 465.89474, "coord_origin": "TOPLEFT" }, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 486.6467, "r_x1": 203.68625, "r_y1": 486.6467, "r_x2": 203.68625, "r_y2": 477.84973, "r_x3": 134.76498, "r_y3": 477.84973, "coord_origin": "TOPLEFT" }, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.76498, "t": 490.06573, "r": 480.59378, "b": 582.54866, "coord_origin": "TOPLEFT" }, "confidence": 0.9853583574295044, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 498.8627, "r_x1": 480.59378, "r_y1": 498.8627, "r_x2": 480.59378, "r_y2": 490.06573, "r_x3": 149.70898, "r_y3": 490.06573, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 510.81769, "r_x1": 480.58871, "r_y1": 510.81769, "r_x2": 480.58871, "r_y2": 502.02072, "r_x3": 134.76498, "r_y3": 502.02072, "coord_origin": "TOPLEFT" }, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 522.7726700000001, "r_x1": 480.58675999999997, "r_y1": 522.7726700000001, "r_x2": 480.58675999999997, "r_y2": 513.9757099999999, "r_x3": 134.76498, "r_y3": 513.9757099999999, "coord_origin": "TOPLEFT" }, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 534.72766, "r_x1": 480.58978, "r_y1": 534.72766, "r_x2": 480.58978, "r_y2": 525.93069, "r_x3": 134.76498, "r_y3": 525.93069, "coord_origin": "TOPLEFT" }, "text": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "orig": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 546.6826599999999, "r_x1": 480.58765, "r_y1": 546.6826599999999, "r_x2": 480.58765, "r_y2": 537.8857, "r_x3": 134.76498, "r_y3": 537.8857, "coord_origin": "TOPLEFT" }, "text": "to investigate if the performance (both in accuracy and inference time) can", "orig": "to investigate if the performance (both in accuracy and inference time) can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 558.63866, "r_x1": 480.58971999999994, "r_y1": 558.63866, "r_x2": 480.58971999999994, "r_y2": 549.84169, "r_x3": 134.76498, "r_y3": 549.84169, "coord_origin": "TOPLEFT" }, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 570.59366, "r_x1": 480.58871, "r_y1": 570.59366, "r_x2": 480.58871, "r_y2": 561.79669, "r_x3": 134.76498, "r_y3": 561.79669, "coord_origin": "TOPLEFT" }, "text": "We believe this is a necessary step before further improving neural network", "orig": "We believe this is a necessary step before further improving neural network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 582.54866, "r_x1": 249.27811, "r_y1": 582.54866, "r_x2": 249.27811, "r_y2": 573.75169, "r_x3": 134.76498, "r_y3": 573.75169, "coord_origin": "TOPLEFT" }, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "section_header", "bbox": { "l": 134.76498, "t": 605.54984, "r": 269.62442, "b": 616.11823, "coord_origin": "TOPLEFT" }, "confidence": 0.9393903017044067, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 616.11823, "r_x1": 141.48859, "r_y1": 616.11823, "r_x2": 141.48859, "r_y2": 605.54984, "r_x3": 134.76498, "r_y3": 605.54984, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93819, "r_y0": 616.11823, "r_x1": 269.62442, "r_y1": 616.11823, "r_x2": 269.62442, "r_y2": 605.54984, "r_x3": 154.93819, "r_y3": 605.54984, "coord_origin": "TOPLEFT" }, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.76498, "t": 632.14769, "r": 480.5936899999999, "b": 664.85566, "coord_origin": "TOPLEFT" }, "confidence": 0.9692807197570801, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 640.94466, "r_x1": 480.59064, "r_y1": 640.94466, "r_x2": 480.59064, "r_y2": 632.14769, "r_x3": 134.76498, "r_y3": 632.14769, "coord_origin": "TOPLEFT" }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 652.89966, "r_x1": 480.5867, "r_y1": 652.89966, "r_x2": 480.5867, "r_y2": 644.1026899999999, "r_x3": 134.76498, "r_y3": 644.1026899999999, "coord_origin": "TOPLEFT" }, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 664.85566, "r_x1": 480.5936899999999, "r_y1": 664.85566, "r_x2": 480.5936899999999, "r_y2": 656.0586900000001, "r_x3": 134.76498, "r_y3": 656.0586900000001, "coord_origin": "TOPLEFT" }, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 6, "page_no": 3, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 139.37193, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.7890051603317261, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4" }, { "label": "page_header", "id": 5, "page_no": 3, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 167.81335, "t": 93.77099999999996, "r": 231.72227, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9045588374137878, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "text", "id": 2, "page_no": 3, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.5957599999999, "b": 259.23792000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.9467443823814392, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.59375, "r_y1": 127.73077, "r_x2": 480.59375, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 480.58774, "r_y1": 139.68579, "r_x2": 480.58774, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 151.64178000000004, "r_x1": 480.58675999999997, "r_y1": 151.64178000000004, "r_x2": 480.58675999999997, "r_y2": 142.84479, "r_x3": 134.765, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 163.59680000000003, "r_x1": 480.5878000000001, "r_y1": 163.59680000000003, "r_x2": 480.5878000000001, "r_y2": 154.7998, "r_x3": 134.765, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "structure representation language, which is often implemented with standard", "orig": "structure representation language, which is often implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 175.55182000000002, "r_x1": 480.59271, "r_y1": 175.55182000000002, "r_x2": 480.59271, "r_y2": 166.75482, "r_x3": 134.765, "r_y3": 166.75482, "coord_origin": "TOPLEFT" }, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 187.50684, "r_x1": 480.5957599999999, "r_y1": 187.50684, "r_x2": 480.5957599999999, "r_y2": 178.70983999999999, "r_x3": 134.765, "r_y3": 178.70983999999999, "coord_origin": "TOPLEFT" }, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 199.46185000000003, "r_x1": 480.59271, "r_y1": 199.46185000000003, "r_x2": 480.59271, "r_y2": 190.66485999999998, "r_x3": 134.765, "r_y3": 190.66485999999998, "coord_origin": "TOPLEFT" }, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 211.41687000000002, "r_x1": 480.59378, "r_y1": 211.41687000000002, "r_x2": 480.59378, "r_y2": 202.61987, "r_x3": 134.765, "r_y3": 202.61987, "coord_origin": "TOPLEFT" }, "text": "in order to obtain the table-structure, which is necessary with OD and GNN", "orig": "in order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 223.37285999999995, "r_x1": 480.58783000000005, "r_y1": 223.37285999999995, "r_x2": 480.58783000000005, "r_y2": 214.57587, "r_x3": 134.765, "r_y3": 214.57587, "coord_origin": "TOPLEFT" }, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 235.32788000000005, "r_x1": 480.58978, "r_y1": 235.32788000000005, "r_x2": 480.58978, "r_y2": 226.53088000000002, "r_x3": 134.765, "r_y3": 226.53088000000002, "coord_origin": "TOPLEFT" }, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 247.28290000000004, "r_x1": 480.59572999999995, "r_y1": 247.28290000000004, "r_x2": 480.59572999999995, "r_y2": 238.48590000000002, "r_x3": 134.765, "r_y3": 238.48590000000002, "coord_origin": "TOPLEFT" }, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 259.23792000000003, "r_x1": 480.59473, "r_y1": 259.23792000000003, "r_x2": 480.59473, "r_y2": 250.44092, "r_x3": 134.765, "r_y3": 250.44092, "coord_origin": "TOPLEFT" }, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells must be merged using an attention network. Im2Seq methods cast the problem as a sequence generation task [4,5,9,22], and therefore need an internal tablestructure representation language, which is often implemented with standard markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods have a natural advantage over the OD and GNN methods by virtue of directly predicting the table-structure. As such, no post-processing or rules are needed in order to obtain the table-structure, which is necessary with OD and GNN approaches. In practice, this is not entirely true, because a predicted sequence of table-structure markup does not necessarily have to be syntactically correct. Hence, depending on the quality of the predicted sequence, some post-processing needs to be performed to ensure a syntactically valid (let alone correct) sequence." }, { "label": "text", "id": 4, "page_no": 3, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.76498, "t": 262.65692, "r": 480.59569999999997, "b": 486.6467, "coord_origin": "TOPLEFT" }, "confidence": 0.929087221622467, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 271.45392000000004, "r_x1": 480.59280000000007, "r_y1": 271.45392000000004, "r_x2": 480.59280000000007, "r_y2": 262.65692, "r_x3": 149.709, "r_y3": 262.65692, "coord_origin": "TOPLEFT" }, "text": "Within the Im2Seq method, we find several popular models, namely the", "orig": "Within the Im2Seq method, we find several popular models, namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 283.40891, "r_x1": 480.59167, "r_y1": 283.40891, "r_x2": 480.59167, "r_y2": 274.61194, "r_x3": 134.765, "r_y3": 274.61194, "coord_origin": "TOPLEFT" }, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 295.36389, "r_x1": 480.59271, "r_y1": 295.36389, "r_x2": 480.59271, "r_y2": 286.56692999999996, "r_x3": 134.765, "r_y3": 286.56692999999996, "coord_origin": "TOPLEFT" }, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 307.31888, "r_x1": 342.02097, "r_y1": 307.31888, "r_x2": 342.02097, "r_y2": 298.52190999999993, "r_x3": 134.765, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.064, "r_y0": 307.31888, "r_x1": 393.04684, "r_y1": 307.31888, "r_x2": 393.04684, "r_y2": 298.52190999999993, "r_x3": 345.064, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.16699, "r_y0": 307.31888, "r_x1": 480.59082, "r_y1": 307.31888, "r_x2": 480.59082, "r_y2": 298.52190999999993, "r_x3": 397.16699, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 319.27487, "r_x1": 333.29871, "r_y1": 319.27487, "r_x2": 333.29871, "r_y2": 310.47791, "r_x3": 134.76498, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.29898, "r_y0": 319.27487, "r_x1": 356.9711, "r_y1": 319.27487, "r_x2": 356.9711, "r_y2": 310.47791, "r_x3": 333.29898, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.08499, "r_y0": 319.27487, "r_x1": 480.59433000000007, "r_y1": 319.27487, "r_x2": 480.59433000000007, "r_y2": 310.47791, "r_x3": 357.08499, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "), the attention is passed to", "orig": "), the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 331.22986, "r_x1": 148.59805, "r_y1": 331.22986, "r_x2": 148.59805, "r_y2": 322.43289, "r_x3": 134.76498, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.27698, "r_y0": 331.22986, "r_x1": 202.1109, "r_y1": 331.22986, "r_x2": 202.1109, "r_y2": 322.43289, "r_x3": 152.27698, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "cell decoder", "orig": "cell decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.86398, "r_y0": 331.22986, "r_x1": 480.58743, "r_y1": 331.22986, "r_x2": 480.58743, "r_y2": 322.43289, "r_x3": 206.86398, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 343.18484, "r_x1": 480.59476, "r_y1": 343.18484, "r_x2": 480.59476, "r_y2": 334.38788, "r_x3": 134.76498, "r_y3": 334.38788, "coord_origin": "TOPLEFT" }, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 355.13983, "r_x1": 480.58675999999997, "r_y1": 355.13983, "r_x2": 480.58675999999997, "r_y2": 346.34286, "r_x3": 134.76498, "r_y3": 346.34286, "coord_origin": "TOPLEFT" }, "text": "TableFormer address this reliance on OCR and uses two transformer decoders for", "orig": "TableFormer address this reliance on OCR and uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 367.09482, "r_x1": 480.58868, "r_y1": 367.09482, "r_x2": 480.58868, "r_y2": 358.29785, "r_x3": 134.76498, "r_y3": 358.29785, "coord_origin": "TOPLEFT" }, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 379.0498, "r_x1": 480.58868, "r_y1": 379.0498, "r_x2": 480.58868, "r_y2": 370.25284, "r_x3": 134.76498, "r_y3": 370.25284, "coord_origin": "TOPLEFT" }, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 391.0058, "r_x1": 480.59357000000006, "r_y1": 391.0058, "r_x2": 480.59357000000006, "r_y2": 382.20883, "r_x3": 134.76498, "r_y3": 382.20883, "coord_origin": "TOPLEFT" }, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 402.96078, "r_x1": 144.76979, "r_y1": 402.96078, "r_x2": 144.76979, "r_y2": 394.16382, "r_x3": 134.76498, "r_y3": 394.16382, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.50908, "r_y0": 402.96078, "r_x1": 480.58667, "r_y1": 402.96078, "r_x2": 480.58667, "r_y2": 394.16382, "r_x3": 149.50908, "r_y3": 394.16382, "coord_origin": "TOPLEFT" }, "text": "proposes a compact double-matrix representation of table rows and columns", "orig": "proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 414.91576999999995, "r_x1": 480.59569999999997, "r_y1": 414.91576999999995, "r_x2": 480.59569999999997, "r_y2": 406.1188, "r_x3": 134.76498, "r_y3": 406.1188, "coord_origin": "TOPLEFT" }, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 426.87076, "r_x1": 480.59180000000003, "r_y1": 426.87076, "r_x2": 480.59180000000003, "r_y2": 418.07379, "r_x3": 134.76498, "r_y3": 418.07379, "coord_origin": "TOPLEFT" }, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 438.82574, "r_x1": 480.5878000000001, "r_y1": 438.82574, "r_x2": 480.5878000000001, "r_y2": 430.02878, "r_x3": 134.76498, "r_y3": 430.02878, "coord_origin": "TOPLEFT" }, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 450.78073, "r_x1": 480.58868, "r_y1": 450.78073, "r_x2": 480.58868, "r_y2": 441.98376, "r_x3": 134.76498, "r_y3": 441.98376, "coord_origin": "TOPLEFT" }, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 462.73672, "r_x1": 384.5752, "r_y1": 462.73672, "r_x2": 384.5752, "r_y2": 453.93976000000004, "r_x3": 134.76498, "r_y3": 453.93976000000004, "coord_origin": "TOPLEFT" }, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.55899, "r_y0": 462.73672, "r_x1": 401.73236, "r_y1": 462.73672, "r_x2": 401.73236, "r_y2": 453.93976000000004, "r_x3": 391.55899, "r_y3": 453.93976000000004, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.55154, "r_y0": 462.73672, "r_x1": 480.58777, "r_y1": 462.73672, "r_x2": 480.58777, "r_y2": 453.93976000000004, "r_x3": 406.55154, "r_y3": 453.93976000000004, "coord_origin": "TOPLEFT" }, "text": "introduces Gated", "orig": "introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 474.69171, "r_x1": 480.59079, "r_y1": 474.69171, "r_x2": 480.59079, "r_y2": 465.89474, "r_x3": 134.76498, "r_y3": 465.89474, "coord_origin": "TOPLEFT" }, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 486.6467, "r_x1": 203.68625, "r_y1": 486.6467, "r_x2": 203.68625, "r_y2": 477.84973, "r_x3": 134.76498, "r_y3": 477.84973, "coord_origin": "TOPLEFT" }, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Within the Im2Seq method, we find several popular models, namely the encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders to predict a table in HTML representation. The tag decoder predicts a sequence of HTML tags. For each decoded table cell ( ), the attention is passed to the cell decoder to predict the content with an embedded OCR approach. The latter makes it susceptible to transcription errors in the cell content of the table. TableFormer address this reliance on OCR and uses two transformer decoders for HTML structure and cell bounding box prediction in an end-to-end architecture. The predicted cell bounding box is then used to extract text tokens from an originating (digital) PDF page, circumventing any need for OCR. TabSplitter [2] proposes a compact double-matrix representation of table rows and columns to do error detection and error correction of HTML structure sequences based on predictions from [19]. This compact double-matrix representation can not be used directly by the Img2seq model training, so the model uses HTML as an intermediate form. Chi et. al. [4] introduce a data set and a baseline method using bidirectional LSTMs to predict LaTeX code. Kayal [5] introduces Gated ResNet transformers to predict LaTeX code, and a separate OCR module to extract content." }, { "label": "text", "id": 0, "page_no": 3, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76498, "t": 490.06573, "r": 480.59378, "b": 582.54866, "coord_origin": "TOPLEFT" }, "confidence": 0.9853583574295044, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 498.8627, "r_x1": 480.59378, "r_y1": 498.8627, "r_x2": 480.59378, "r_y2": 490.06573, "r_x3": 149.70898, "r_y3": 490.06573, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 510.81769, "r_x1": 480.58871, "r_y1": 510.81769, "r_x2": 480.58871, "r_y2": 502.02072, "r_x3": 134.76498, "r_y3": 502.02072, "coord_origin": "TOPLEFT" }, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 522.7726700000001, "r_x1": 480.58675999999997, "r_y1": 522.7726700000001, "r_x2": 480.58675999999997, "r_y2": 513.9757099999999, "r_x3": 134.76498, "r_y3": 513.9757099999999, "coord_origin": "TOPLEFT" }, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 534.72766, "r_x1": 480.58978, "r_y1": 534.72766, "r_x2": 480.58978, "r_y2": 525.93069, "r_x3": 134.76498, "r_y3": 525.93069, "coord_origin": "TOPLEFT" }, "text": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "orig": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 546.6826599999999, "r_x1": 480.58765, "r_y1": 546.6826599999999, "r_x2": 480.58765, "r_y2": 537.8857, "r_x3": 134.76498, "r_y3": 537.8857, "coord_origin": "TOPLEFT" }, "text": "to investigate if the performance (both in accuracy and inference time) can", "orig": "to investigate if the performance (both in accuracy and inference time) can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 558.63866, "r_x1": 480.58971999999994, "r_y1": 558.63866, "r_x2": 480.58971999999994, "r_y2": 549.84169, "r_x3": 134.76498, "r_y3": 549.84169, "coord_origin": "TOPLEFT" }, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 570.59366, "r_x1": 480.58871, "r_y1": 570.59366, "r_x2": 480.58871, "r_y2": 561.79669, "r_x3": 134.76498, "r_y3": 561.79669, "coord_origin": "TOPLEFT" }, "text": "We believe this is a necessary step before further improving neural network", "orig": "We believe this is a necessary step before further improving neural network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 582.54866, "r_x1": 249.27811, "r_y1": 582.54866, "r_x2": 249.27811, "r_y2": 573.75169, "r_x3": 134.76498, "r_y3": 573.75169, "coord_origin": "TOPLEFT" }, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a full end-to-end network design that can output the final table structure without pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated to deliver state-of-the-art prediction accuracy [9]. This motivated the authors to investigate if the performance (both in accuracy and inference time) can be further improved by optimising the table structure representation language. We believe this is a necessary step before further improving neural network architectures for this task." }, { "label": "section_header", "id": 3, "page_no": 3, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.76498, "t": 605.54984, "r": 269.62442, "b": 616.11823, "coord_origin": "TOPLEFT" }, "confidence": 0.9393903017044067, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 616.11823, "r_x1": 141.48859, "r_y1": 616.11823, "r_x2": 141.48859, "r_y2": 605.54984, "r_x3": 134.76498, "r_y3": 605.54984, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93819, "r_y0": 616.11823, "r_x1": 269.62442, "r_y1": 616.11823, "r_x2": 269.62442, "r_y2": 605.54984, "r_x3": 154.93819, "r_y3": 605.54984, "coord_origin": "TOPLEFT" }, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3 Problem Statement" }, { "label": "text", "id": 1, "page_no": 3, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76498, "t": 632.14769, "r": 480.5936899999999, "b": 664.85566, "coord_origin": "TOPLEFT" }, "confidence": 0.9692807197570801, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 640.94466, "r_x1": 480.59064, "r_y1": 640.94466, "r_x2": 480.59064, "r_y2": 632.14769, "r_x3": 134.76498, "r_y3": 632.14769, "coord_origin": "TOPLEFT" }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 652.89966, "r_x1": 480.5867, "r_y1": 652.89966, "r_x2": 480.5867, "r_y2": 644.1026899999999, "r_x3": 134.76498, "r_y3": 644.1026899999999, "coord_origin": "TOPLEFT" }, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 664.85566, "r_x1": 480.5936899999999, "r_y1": 664.85566, "r_x2": 480.5936899999999, "r_y2": 656.0586900000001, "r_x3": 134.76498, "r_y3": 656.0586900000001, "coord_origin": "TOPLEFT" }, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways. Given an image of a table, the Im2Seq model predicts the structure of the table by generating a sequence of tokens. These tokens originate from a finite vocab-" } ], "body": [ { "label": "text", "id": 2, "page_no": 3, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.5957599999999, "b": 259.23792000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.9467443823814392, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.59375, "r_y1": 127.73077, "r_x2": 480.59375, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 480.58774, "r_y1": 139.68579, "r_x2": 480.58774, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 151.64178000000004, "r_x1": 480.58675999999997, "r_y1": 151.64178000000004, "r_x2": 480.58675999999997, "r_y2": 142.84479, "r_x3": 134.765, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 163.59680000000003, "r_x1": 480.5878000000001, "r_y1": 163.59680000000003, "r_x2": 480.5878000000001, "r_y2": 154.7998, "r_x3": 134.765, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "structure representation language, which is often implemented with standard", "orig": "structure representation language, which is often implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 175.55182000000002, "r_x1": 480.59271, "r_y1": 175.55182000000002, "r_x2": 480.59271, "r_y2": 166.75482, "r_x3": 134.765, "r_y3": 166.75482, "coord_origin": "TOPLEFT" }, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 187.50684, "r_x1": 480.5957599999999, "r_y1": 187.50684, "r_x2": 480.5957599999999, "r_y2": 178.70983999999999, "r_x3": 134.765, "r_y3": 178.70983999999999, "coord_origin": "TOPLEFT" }, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 199.46185000000003, "r_x1": 480.59271, "r_y1": 199.46185000000003, "r_x2": 480.59271, "r_y2": 190.66485999999998, "r_x3": 134.765, "r_y3": 190.66485999999998, "coord_origin": "TOPLEFT" }, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 211.41687000000002, "r_x1": 480.59378, "r_y1": 211.41687000000002, "r_x2": 480.59378, "r_y2": 202.61987, "r_x3": 134.765, "r_y3": 202.61987, "coord_origin": "TOPLEFT" }, "text": "in order to obtain the table-structure, which is necessary with OD and GNN", "orig": "in order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 223.37285999999995, "r_x1": 480.58783000000005, "r_y1": 223.37285999999995, "r_x2": 480.58783000000005, "r_y2": 214.57587, "r_x3": 134.765, "r_y3": 214.57587, "coord_origin": "TOPLEFT" }, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 235.32788000000005, "r_x1": 480.58978, "r_y1": 235.32788000000005, "r_x2": 480.58978, "r_y2": 226.53088000000002, "r_x3": 134.765, "r_y3": 226.53088000000002, "coord_origin": "TOPLEFT" }, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 247.28290000000004, "r_x1": 480.59572999999995, "r_y1": 247.28290000000004, "r_x2": 480.59572999999995, "r_y2": 238.48590000000002, "r_x3": 134.765, "r_y3": 238.48590000000002, "coord_origin": "TOPLEFT" }, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 259.23792000000003, "r_x1": 480.59473, "r_y1": 259.23792000000003, "r_x2": 480.59473, "r_y2": 250.44092, "r_x3": 134.765, "r_y3": 250.44092, "coord_origin": "TOPLEFT" }, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells must be merged using an attention network. Im2Seq methods cast the problem as a sequence generation task [4,5,9,22], and therefore need an internal tablestructure representation language, which is often implemented with standard markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods have a natural advantage over the OD and GNN methods by virtue of directly predicting the table-structure. As such, no post-processing or rules are needed in order to obtain the table-structure, which is necessary with OD and GNN approaches. In practice, this is not entirely true, because a predicted sequence of table-structure markup does not necessarily have to be syntactically correct. Hence, depending on the quality of the predicted sequence, some post-processing needs to be performed to ensure a syntactically valid (let alone correct) sequence." }, { "label": "text", "id": 4, "page_no": 3, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.76498, "t": 262.65692, "r": 480.59569999999997, "b": 486.6467, "coord_origin": "TOPLEFT" }, "confidence": 0.929087221622467, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 271.45392000000004, "r_x1": 480.59280000000007, "r_y1": 271.45392000000004, "r_x2": 480.59280000000007, "r_y2": 262.65692, "r_x3": 149.709, "r_y3": 262.65692, "coord_origin": "TOPLEFT" }, "text": "Within the Im2Seq method, we find several popular models, namely the", "orig": "Within the Im2Seq method, we find several popular models, namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 283.40891, "r_x1": 480.59167, "r_y1": 283.40891, "r_x2": 480.59167, "r_y2": 274.61194, "r_x3": 134.765, "r_y3": 274.61194, "coord_origin": "TOPLEFT" }, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 295.36389, "r_x1": 480.59271, "r_y1": 295.36389, "r_x2": 480.59271, "r_y2": 286.56692999999996, "r_x3": 134.765, "r_y3": 286.56692999999996, "coord_origin": "TOPLEFT" }, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 307.31888, "r_x1": 342.02097, "r_y1": 307.31888, "r_x2": 342.02097, "r_y2": 298.52190999999993, "r_x3": 134.765, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.064, "r_y0": 307.31888, "r_x1": 393.04684, "r_y1": 307.31888, "r_x2": 393.04684, "r_y2": 298.52190999999993, "r_x3": 345.064, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.16699, "r_y0": 307.31888, "r_x1": 480.59082, "r_y1": 307.31888, "r_x2": 480.59082, "r_y2": 298.52190999999993, "r_x3": 397.16699, "r_y3": 298.52190999999993, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 319.27487, "r_x1": 333.29871, "r_y1": 319.27487, "r_x2": 333.29871, "r_y2": 310.47791, "r_x3": 134.76498, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.29898, "r_y0": 319.27487, "r_x1": 356.9711, "r_y1": 319.27487, "r_x2": 356.9711, "r_y2": 310.47791, "r_x3": 333.29898, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.08499, "r_y0": 319.27487, "r_x1": 480.59433000000007, "r_y1": 319.27487, "r_x2": 480.59433000000007, "r_y2": 310.47791, "r_x3": 357.08499, "r_y3": 310.47791, "coord_origin": "TOPLEFT" }, "text": "), the attention is passed to", "orig": "), the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 331.22986, "r_x1": 148.59805, "r_y1": 331.22986, "r_x2": 148.59805, "r_y2": 322.43289, "r_x3": 134.76498, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.27698, "r_y0": 331.22986, "r_x1": 202.1109, "r_y1": 331.22986, "r_x2": 202.1109, "r_y2": 322.43289, "r_x3": 152.27698, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "cell decoder", "orig": "cell decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.86398, "r_y0": 331.22986, "r_x1": 480.58743, "r_y1": 331.22986, "r_x2": 480.58743, "r_y2": 322.43289, "r_x3": 206.86398, "r_y3": 322.43289, "coord_origin": "TOPLEFT" }, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 343.18484, "r_x1": 480.59476, "r_y1": 343.18484, "r_x2": 480.59476, "r_y2": 334.38788, "r_x3": 134.76498, "r_y3": 334.38788, "coord_origin": "TOPLEFT" }, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 355.13983, "r_x1": 480.58675999999997, "r_y1": 355.13983, "r_x2": 480.58675999999997, "r_y2": 346.34286, "r_x3": 134.76498, "r_y3": 346.34286, "coord_origin": "TOPLEFT" }, "text": "TableFormer address this reliance on OCR and uses two transformer decoders for", "orig": "TableFormer address this reliance on OCR and uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 367.09482, "r_x1": 480.58868, "r_y1": 367.09482, "r_x2": 480.58868, "r_y2": 358.29785, "r_x3": 134.76498, "r_y3": 358.29785, "coord_origin": "TOPLEFT" }, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 379.0498, "r_x1": 480.58868, "r_y1": 379.0498, "r_x2": 480.58868, "r_y2": 370.25284, "r_x3": 134.76498, "r_y3": 370.25284, "coord_origin": "TOPLEFT" }, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 391.0058, "r_x1": 480.59357000000006, "r_y1": 391.0058, "r_x2": 480.59357000000006, "r_y2": 382.20883, "r_x3": 134.76498, "r_y3": 382.20883, "coord_origin": "TOPLEFT" }, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 402.96078, "r_x1": 144.76979, "r_y1": 402.96078, "r_x2": 144.76979, "r_y2": 394.16382, "r_x3": 134.76498, "r_y3": 394.16382, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.50908, "r_y0": 402.96078, "r_x1": 480.58667, "r_y1": 402.96078, "r_x2": 480.58667, "r_y2": 394.16382, "r_x3": 149.50908, "r_y3": 394.16382, "coord_origin": "TOPLEFT" }, "text": "proposes a compact double-matrix representation of table rows and columns", "orig": "proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 414.91576999999995, "r_x1": 480.59569999999997, "r_y1": 414.91576999999995, "r_x2": 480.59569999999997, "r_y2": 406.1188, "r_x3": 134.76498, "r_y3": 406.1188, "coord_origin": "TOPLEFT" }, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 426.87076, "r_x1": 480.59180000000003, "r_y1": 426.87076, "r_x2": 480.59180000000003, "r_y2": 418.07379, "r_x3": 134.76498, "r_y3": 418.07379, "coord_origin": "TOPLEFT" }, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 438.82574, "r_x1": 480.5878000000001, "r_y1": 438.82574, "r_x2": 480.5878000000001, "r_y2": 430.02878, "r_x3": 134.76498, "r_y3": 430.02878, "coord_origin": "TOPLEFT" }, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 450.78073, "r_x1": 480.58868, "r_y1": 450.78073, "r_x2": 480.58868, "r_y2": 441.98376, "r_x3": 134.76498, "r_y3": 441.98376, "coord_origin": "TOPLEFT" }, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 462.73672, "r_x1": 384.5752, "r_y1": 462.73672, "r_x2": 384.5752, "r_y2": 453.93976000000004, "r_x3": 134.76498, "r_y3": 453.93976000000004, "coord_origin": "TOPLEFT" }, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.55899, "r_y0": 462.73672, "r_x1": 401.73236, "r_y1": 462.73672, "r_x2": 401.73236, "r_y2": 453.93976000000004, "r_x3": 391.55899, "r_y3": 453.93976000000004, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.55154, "r_y0": 462.73672, "r_x1": 480.58777, "r_y1": 462.73672, "r_x2": 480.58777, "r_y2": 453.93976000000004, "r_x3": 406.55154, "r_y3": 453.93976000000004, "coord_origin": "TOPLEFT" }, "text": "introduces Gated", "orig": "introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 474.69171, "r_x1": 480.59079, "r_y1": 474.69171, "r_x2": 480.59079, "r_y2": 465.89474, "r_x3": 134.76498, "r_y3": 465.89474, "coord_origin": "TOPLEFT" }, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 486.6467, "r_x1": 203.68625, "r_y1": 486.6467, "r_x2": 203.68625, "r_y2": 477.84973, "r_x3": 134.76498, "r_y3": 477.84973, "coord_origin": "TOPLEFT" }, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Within the Im2Seq method, we find several popular models, namely the encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders to predict a table in HTML representation. The tag decoder predicts a sequence of HTML tags. For each decoded table cell ( ), the attention is passed to the cell decoder to predict the content with an embedded OCR approach. The latter makes it susceptible to transcription errors in the cell content of the table. TableFormer address this reliance on OCR and uses two transformer decoders for HTML structure and cell bounding box prediction in an end-to-end architecture. The predicted cell bounding box is then used to extract text tokens from an originating (digital) PDF page, circumventing any need for OCR. TabSplitter [2] proposes a compact double-matrix representation of table rows and columns to do error detection and error correction of HTML structure sequences based on predictions from [19]. This compact double-matrix representation can not be used directly by the Img2seq model training, so the model uses HTML as an intermediate form. Chi et. al. [4] introduce a data set and a baseline method using bidirectional LSTMs to predict LaTeX code. Kayal [5] introduces Gated ResNet transformers to predict LaTeX code, and a separate OCR module to extract content." }, { "label": "text", "id": 0, "page_no": 3, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76498, "t": 490.06573, "r": 480.59378, "b": 582.54866, "coord_origin": "TOPLEFT" }, "confidence": 0.9853583574295044, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 498.8627, "r_x1": 480.59378, "r_y1": 498.8627, "r_x2": 480.59378, "r_y2": 490.06573, "r_x3": 149.70898, "r_y3": 490.06573, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 510.81769, "r_x1": 480.58871, "r_y1": 510.81769, "r_x2": 480.58871, "r_y2": 502.02072, "r_x3": 134.76498, "r_y3": 502.02072, "coord_origin": "TOPLEFT" }, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 522.7726700000001, "r_x1": 480.58675999999997, "r_y1": 522.7726700000001, "r_x2": 480.58675999999997, "r_y2": 513.9757099999999, "r_x3": 134.76498, "r_y3": 513.9757099999999, "coord_origin": "TOPLEFT" }, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 534.72766, "r_x1": 480.58978, "r_y1": 534.72766, "r_x2": 480.58978, "r_y2": 525.93069, "r_x3": 134.76498, "r_y3": 525.93069, "coord_origin": "TOPLEFT" }, "text": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "orig": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 546.6826599999999, "r_x1": 480.58765, "r_y1": 546.6826599999999, "r_x2": 480.58765, "r_y2": 537.8857, "r_x3": 134.76498, "r_y3": 537.8857, "coord_origin": "TOPLEFT" }, "text": "to investigate if the performance (both in accuracy and inference time) can", "orig": "to investigate if the performance (both in accuracy and inference time) can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 558.63866, "r_x1": 480.58971999999994, "r_y1": 558.63866, "r_x2": 480.58971999999994, "r_y2": 549.84169, "r_x3": 134.76498, "r_y3": 549.84169, "coord_origin": "TOPLEFT" }, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 570.59366, "r_x1": 480.58871, "r_y1": 570.59366, "r_x2": 480.58871, "r_y2": 561.79669, "r_x3": 134.76498, "r_y3": 561.79669, "coord_origin": "TOPLEFT" }, "text": "We believe this is a necessary step before further improving neural network", "orig": "We believe this is a necessary step before further improving neural network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 582.54866, "r_x1": 249.27811, "r_y1": 582.54866, "r_x2": 249.27811, "r_y2": 573.75169, "r_x3": 134.76498, "r_y3": 573.75169, "coord_origin": "TOPLEFT" }, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a full end-to-end network design that can output the final table structure without pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated to deliver state-of-the-art prediction accuracy [9]. This motivated the authors to investigate if the performance (both in accuracy and inference time) can be further improved by optimising the table structure representation language. We believe this is a necessary step before further improving neural network architectures for this task." }, { "label": "section_header", "id": 3, "page_no": 3, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.76498, "t": 605.54984, "r": 269.62442, "b": 616.11823, "coord_origin": "TOPLEFT" }, "confidence": 0.9393903017044067, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 616.11823, "r_x1": 141.48859, "r_y1": 616.11823, "r_x2": 141.48859, "r_y2": 605.54984, "r_x3": 134.76498, "r_y3": 605.54984, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93819, "r_y0": 616.11823, "r_x1": 269.62442, "r_y1": 616.11823, "r_x2": 269.62442, "r_y2": 605.54984, "r_x3": 154.93819, "r_y3": 605.54984, "coord_origin": "TOPLEFT" }, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3 Problem Statement" }, { "label": "text", "id": 1, "page_no": 3, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76498, "t": 632.14769, "r": 480.5936899999999, "b": 664.85566, "coord_origin": "TOPLEFT" }, "confidence": 0.9692807197570801, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 640.94466, "r_x1": 480.59064, "r_y1": 640.94466, "r_x2": 480.59064, "r_y2": 632.14769, "r_x3": 134.76498, "r_y3": 632.14769, "coord_origin": "TOPLEFT" }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 652.89966, "r_x1": 480.5867, "r_y1": 652.89966, "r_x2": 480.5867, "r_y2": 644.1026899999999, "r_x3": 134.76498, "r_y3": 644.1026899999999, "coord_origin": "TOPLEFT" }, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 664.85566, "r_x1": 480.5936899999999, "r_y1": 664.85566, "r_x2": 480.5936899999999, "r_y2": 656.0586900000001, "r_x3": 134.76498, "r_y3": 656.0586900000001, "coord_origin": "TOPLEFT" }, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways. Given an image of a table, the Im2Seq model predicts the structure of the table by generating a sequence of tokens. These tokens originate from a finite vocab-" } ], "headers": [ { "label": "page_header", "id": 6, "page_no": 3, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 139.37193, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.7890051603317261, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4" }, { "label": "page_header", "id": 5, "page_no": 3, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 167.81335, "t": 93.77099999999996, "r": 231.72227, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9045588374137878, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 4, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.58577999999994, "r_y1": 127.73077, "r_x2": 480.58577999999994, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 162.48494, "r_y1": 139.68579, "r_x2": 162.48494, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.368, "r_y0": 139.68579, "r_x1": 201.74918, "r_y1": 139.68579, "r_x2": 201.74918, "r_y2": 130.88878999999997, "r_x3": 166.368, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.74899, "r_y0": 139.68579, "r_x1": 204.51561, "r_y1": 139.68579, "r_x2": 204.51561, "r_y2": 130.88878999999997, "r_x3": 201.74899, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.39699, "r_y0": 139.68579, "r_x1": 248.86904999999996, "r_y1": 139.68579, "r_x2": 248.86904999999996, "r_y2": 130.88878999999997, "r_x3": 208.39699, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.86899, "r_y0": 139.68579, "r_x1": 251.6356, "r_y1": 139.68579, "r_x2": 251.6356, "r_y2": 130.88878999999997, "r_x3": 248.86899, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.51698, "r_y0": 139.68579, "r_x1": 278.29846, "r_y1": 139.68579, "r_x2": 278.29846, "r_y2": 130.88878999999997, "r_x3": 255.51698, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.29797, "r_y0": 139.68579, "r_x1": 281.06458, "r_y1": 139.68579, "r_x2": 281.06458, "r_y2": 130.88878999999997, "r_x3": 278.29797, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.94598, "r_y0": 139.68579, "r_x1": 312.81836, "r_y1": 139.68579, "r_x2": 312.81836, "r_y2": 130.88878999999997, "r_x3": 284.94598, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.81799, "r_y0": 139.68579, "r_x1": 315.58459, "r_y1": 139.68579, "r_x2": 315.58459, "r_y2": 130.88878999999997, "r_x3": 312.81799, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 319.466, "r_y0": 139.68579, "r_x1": 343.13812, "r_y1": 139.68579, "r_x2": 343.13812, "r_y2": 130.88878999999997, "r_x3": 319.466, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.13202, "r_y0": 139.68579, "r_x1": 363.17877, "r_y1": 139.68579, "r_x2": 363.17877, "r_y2": 130.88878999999997, "r_x3": 347.13202, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06003, "r_y0": 139.68579, "r_x1": 395.82306, "r_y1": 139.68579, "r_x2": 395.82306, "r_y2": 130.88878999999997, "r_x3": 367.06003, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.82303, "r_y0": 139.68579, "r_x1": 480.59177000000005, "r_y1": 139.68579, "r_x2": 480.59177000000005, "r_y2": 130.88878999999997, "r_x3": 395.82303, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ", one can construct", "orig": ", one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 151.64178000000004, "r_x1": 480.59365999999994, "r_y1": 151.64178000000004, "r_x2": 480.59365999999994, "r_y2": 142.84479, "r_x3": 134.76501, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 163.59680000000003, "r_x1": 480.58577999999994, "r_y1": 163.59680000000003, "r_x2": 480.58577999999994, "r_y2": 154.7998, "r_x3": 134.76501, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 175.55182000000002, "r_x1": 480.59378, "r_y1": 175.55182000000002, "r_x2": 480.59378, "r_y2": 166.75482, "r_x3": 134.76501, "r_y3": 166.75482, "coord_origin": "TOPLEFT" }, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 187.50684, "r_x1": 261.92566, "r_y1": 187.50684, "r_x2": 261.92566, "r_y2": 178.70983999999999, "r_x3": 134.76501, "r_y3": 178.70983999999999, "coord_origin": "TOPLEFT" }, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.60701, "r_y0": 229.00562000000002, "r_x1": 173.48625, "r_y1": 229.00562000000002, "r_x2": 173.48625, "r_y2": 221.07928000000004, "r_x3": 145.60701, "r_y3": 221.07928000000004, "coord_origin": "TOPLEFT" }, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56001, "r_y0": 229.21178999999995, "r_x1": 469.75223000000005, "r_y1": 229.21178999999995, "r_x2": 469.75223000000005, "r_y2": 221.14209000000005, "r_x3": 176.56001, "r_y3": 221.14209000000005, "coord_origin": "TOPLEFT" }, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 377.00375, "r_x1": 480.59283000000005, "r_y1": 377.00375, "r_x2": 480.59283000000005, "r_y2": 368.20679, "r_x3": 149.709, "r_y3": 368.20679, "coord_origin": "TOPLEFT" }, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 388.9587399999999, "r_x1": 480.58664, "r_y1": 388.9587399999999, "r_x2": 480.58664, "r_y2": 380.16177, "r_x3": 134.765, "r_y3": 380.16177, "coord_origin": "TOPLEFT" }, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 400.91373, "r_x1": 480.59180000000003, "r_y1": 400.91373, "r_x2": 480.59180000000003, "r_y2": 392.11676, "r_x3": 134.765, "r_y3": 392.11676, "coord_origin": "TOPLEFT" }, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 412.86871, "r_x1": 480.5897499999999, "r_y1": 412.86871, "r_x2": 480.5897499999999, "r_y2": 404.07175, "r_x3": 134.765, "r_y3": 404.07175, "coord_origin": "TOPLEFT" }, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 424.82471, "r_x1": 480.58871, "r_y1": 424.82471, "r_x2": 480.58871, "r_y2": 416.02774, "r_x3": 134.765, "r_y3": 416.02774, "coord_origin": "TOPLEFT" }, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 436.77969, "r_x1": 480.59265, "r_y1": 436.77969, "r_x2": 480.59265, "r_y2": 427.98273, "r_x3": 134.765, "r_y3": 427.98273, "coord_origin": "TOPLEFT" }, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 448.73467999999997, "r_x1": 187.93439, "r_y1": 448.73467999999997, "r_x2": 187.93439, "r_y2": 439.9377099999999, "r_x3": 134.765, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.931, "r_y0": 448.73467999999997, "r_x1": 211.60313, "r_y1": 448.73467999999997, "r_x2": 211.60313, "r_y2": 439.9377099999999, "r_x3": 187.931, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.75400000000002, "r_y0": 448.73467999999997, "r_x1": 230.80075000000002, "r_y1": 448.73467999999997, "r_x2": 230.80075000000002, "r_y2": 439.9377099999999, "r_x3": 214.75400000000002, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.83898999999997, "r_y0": 448.73467999999997, "r_x1": 262.60202, "r_y1": 448.73467999999997, "r_x2": 262.60202, "r_y2": 439.9377099999999, "r_x3": 233.83898999999997, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.716, "r_y0": 448.73467999999997, "r_x1": 480.59009, "r_y1": 448.73467999999997, "r_x2": 480.59009, "r_y2": 439.9377099999999, "r_x3": 262.716, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 460.68967, "r_x1": 480.58777, "r_y1": 460.68967, "r_x2": 480.58777, "r_y2": 451.8927, "r_x3": 134.76501, "r_y3": 451.8927, "coord_origin": "TOPLEFT" }, "text": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "orig": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 472.64465, "r_x1": 480.58681999999993, "r_y1": 472.64465, "r_x2": 480.58681999999993, "r_y2": 463.84769, "r_x3": 134.76501, "r_y3": 463.84769, "coord_origin": "TOPLEFT" }, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 484.60065, "r_x1": 480.58681999999993, "r_y1": 484.60065, "r_x2": 480.58681999999993, "r_y2": 475.80368, "r_x3": 134.76501, "r_y3": 475.80368, "coord_origin": "TOPLEFT" }, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 496.55563, "r_x1": 480.59067, "r_y1": 496.55563, "r_x2": 480.59067, "r_y2": 487.75867, "r_x3": 134.76501, "r_y3": 487.75867, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 508.51062, "r_x1": 480.59277, "r_y1": 508.51062, "r_x2": 480.59277, "r_y2": 499.71365, "r_x3": 134.76501, "r_y3": 499.71365, "coord_origin": "TOPLEFT" }, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 520.46561, "r_x1": 480.59476, "r_y1": 520.46561, "r_x2": 480.59476, "r_y2": 511.66864, "r_x3": 134.76501, "r_y3": 511.66864, "coord_origin": "TOPLEFT" }, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 532.42059, "r_x1": 176.92873, "r_y1": 532.42059, "r_x2": 176.92873, "r_y2": 523.62363, "r_x3": 134.76501, "r_y3": 523.62363, "coord_origin": "TOPLEFT" }, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70901, "r_y0": 544.8396, "r_x1": 480.59289999999993, "r_y1": 544.8396, "r_x2": 480.59289999999993, "r_y2": 536.04263, "r_x3": 149.70901, "r_y3": 536.04263, "coord_origin": "TOPLEFT" }, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 556.7946000000001, "r_x1": 480.59085, "r_y1": 556.7946000000001, "r_x2": 480.59085, "r_y2": 547.99763, "r_x3": 134.76501, "r_y3": 547.99763, "coord_origin": "TOPLEFT" }, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 568.7496, "r_x1": 480.58984, "r_y1": 568.7496, "r_x2": 480.58984, "r_y2": 559.95264, "r_x3": 134.76501, "r_y3": 559.95264, "coord_origin": "TOPLEFT" }, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 580.7056, "r_x1": 452.18933, "r_y1": 580.7056, "r_x2": 452.18933, "r_y2": 571.90863, "r_x3": 134.76501, "r_y3": 571.90863, "coord_origin": "TOPLEFT" }, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70901, "r_y0": 593.1236, "r_x1": 480.59283000000005, "r_y1": 593.1236, "r_x2": 480.59283000000005, "r_y2": 584.32663, "r_x3": 149.70901, "r_y3": 584.32663, "coord_origin": "TOPLEFT" }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 605.07959, "r_x1": 480.58978, "r_y1": 605.07959, "r_x2": 480.58978, "r_y2": 596.28262, "r_x3": 134.76501, "r_y3": 596.28262, "coord_origin": "TOPLEFT" }, "text": "cells, serialised in row-major ordering, where each row and each column have", "orig": "cells, serialised in row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 617.03459, "r_x1": 480.5936899999999, "r_y1": 617.03459, "r_x2": 480.5936899999999, "r_y2": 608.23763, "r_x3": 134.76501, "r_y3": 608.23763, "coord_origin": "TOPLEFT" }, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 628.98959, "r_x1": 480.59091, "r_y1": 628.98959, "r_x2": 480.59091, "r_y2": 620.19263, "r_x3": 134.76501, "r_y3": 620.19263, "coord_origin": "TOPLEFT" }, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 640.9446, "r_x1": 480.58582, "r_y1": 640.9446, "r_x2": 480.58582, "r_y2": 632.1476299999999, "r_x3": 134.76501, "r_y3": 632.1476299999999, "coord_origin": "TOPLEFT" }, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 652.8996, "r_x1": 480.59180000000003, "r_y1": 652.8996, "r_x2": 480.59180000000003, "r_y2": 644.10263, "r_x3": 134.76501, "r_y3": 644.10263, "coord_origin": "TOPLEFT" }, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 664.85461, "r_x1": 480.59473, "r_y1": 664.85461, "r_x2": 480.59473, "r_y2": 656.05763, "r_x3": 134.76501, "r_y3": 656.05763, "coord_origin": "TOPLEFT" }, "text": "it is complex to verify the consistency of predicted structures during sequence", "orig": "it is complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9269194602966309, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 475.98431, "t": 93.77099999999996, "r": 480.59125000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8696112036705017, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.59378, "b": 187.50684, "coord_origin": "TOPLEFT" }, "confidence": 0.9857171773910522, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.58577999999994, "r_y1": 127.73077, "r_x2": 480.58577999999994, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 162.48494, "r_y1": 139.68579, "r_x2": 162.48494, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.368, "r_y0": 139.68579, "r_x1": 201.74918, "r_y1": 139.68579, "r_x2": 201.74918, "r_y2": 130.88878999999997, "r_x3": 166.368, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.74899, "r_y0": 139.68579, "r_x1": 204.51561, "r_y1": 139.68579, "r_x2": 204.51561, "r_y2": 130.88878999999997, "r_x3": 201.74899, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.39699, "r_y0": 139.68579, "r_x1": 248.86904999999996, "r_y1": 139.68579, "r_x2": 248.86904999999996, "r_y2": 130.88878999999997, "r_x3": 208.39699, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.86899, "r_y0": 139.68579, "r_x1": 251.6356, "r_y1": 139.68579, "r_x2": 251.6356, "r_y2": 130.88878999999997, "r_x3": 248.86899, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.51698, "r_y0": 139.68579, "r_x1": 278.29846, "r_y1": 139.68579, "r_x2": 278.29846, "r_y2": 130.88878999999997, "r_x3": 255.51698, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.29797, "r_y0": 139.68579, "r_x1": 281.06458, "r_y1": 139.68579, "r_x2": 281.06458, "r_y2": 130.88878999999997, "r_x3": 278.29797, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.94598, "r_y0": 139.68579, "r_x1": 312.81836, "r_y1": 139.68579, "r_x2": 312.81836, "r_y2": 130.88878999999997, "r_x3": 284.94598, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.81799, "r_y0": 139.68579, "r_x1": 315.58459, "r_y1": 139.68579, "r_x2": 315.58459, "r_y2": 130.88878999999997, "r_x3": 312.81799, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 319.466, "r_y0": 139.68579, "r_x1": 343.13812, "r_y1": 139.68579, "r_x2": 343.13812, "r_y2": 130.88878999999997, "r_x3": 319.466, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.13202, "r_y0": 139.68579, "r_x1": 363.17877, "r_y1": 139.68579, "r_x2": 363.17877, "r_y2": 130.88878999999997, "r_x3": 347.13202, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06003, "r_y0": 139.68579, "r_x1": 395.82306, "r_y1": 139.68579, "r_x2": 395.82306, "r_y2": 130.88878999999997, "r_x3": 367.06003, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.82303, "r_y0": 139.68579, "r_x1": 480.59177000000005, "r_y1": 139.68579, "r_x2": 480.59177000000005, "r_y2": 130.88878999999997, "r_x3": 395.82303, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ", one can construct", "orig": ", one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 151.64178000000004, "r_x1": 480.59365999999994, "r_y1": 151.64178000000004, "r_x2": 480.59365999999994, "r_y2": 142.84479, "r_x3": 134.76501, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 163.59680000000003, "r_x1": 480.58577999999994, "r_y1": 163.59680000000003, "r_x2": 480.58577999999994, "r_y2": 154.7998, "r_x3": 134.76501, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 175.55182000000002, "r_x1": 480.59378, "r_y1": 175.55182000000002, "r_x2": 480.59378, "r_y2": 166.75482, "r_x3": 134.76501, "r_y3": 166.75482, "coord_origin": "TOPLEFT" }, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 187.50684, "r_x1": 261.92566, "r_y1": 187.50684, "r_x2": 261.92566, "r_y2": 178.70983999999999, "r_x3": 134.76501, "r_y3": 178.70983999999999, "coord_origin": "TOPLEFT" }, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "caption", "bbox": { "l": 145.60701, "t": 221.07928000000004, "r": 469.75223000000005, "b": 229.21178999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.8472551703453064, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.60701, "r_y0": 229.00562000000002, "r_x1": 173.48625, "r_y1": 229.00562000000002, "r_x2": 173.48625, "r_y2": 221.07928000000004, "r_x3": 145.60701, "r_y3": 221.07928000000004, "coord_origin": "TOPLEFT" }, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56001, "r_y0": 229.21178999999995, "r_x1": 469.75223000000005, "r_y1": 229.21178999999995, "r_x2": 469.75223000000005, "r_y2": 221.14209000000005, "r_x3": 176.56001, "r_y3": 221.14209000000005, "coord_origin": "TOPLEFT" }, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 368.20679, "r": 480.59476, "b": 532.42059, "coord_origin": "TOPLEFT" }, "confidence": 0.9844799637794495, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 377.00375, "r_x1": 480.59283000000005, "r_y1": 377.00375, "r_x2": 480.59283000000005, "r_y2": 368.20679, "r_x3": 149.709, "r_y3": 368.20679, "coord_origin": "TOPLEFT" }, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 388.9587399999999, "r_x1": 480.58664, "r_y1": 388.9587399999999, "r_x2": 480.58664, "r_y2": 380.16177, "r_x3": 134.765, "r_y3": 380.16177, "coord_origin": "TOPLEFT" }, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 400.91373, "r_x1": 480.59180000000003, "r_y1": 400.91373, "r_x2": 480.59180000000003, "r_y2": 392.11676, "r_x3": 134.765, "r_y3": 392.11676, "coord_origin": "TOPLEFT" }, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 412.86871, "r_x1": 480.5897499999999, "r_y1": 412.86871, "r_x2": 480.5897499999999, "r_y2": 404.07175, "r_x3": 134.765, "r_y3": 404.07175, "coord_origin": "TOPLEFT" }, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 424.82471, "r_x1": 480.58871, "r_y1": 424.82471, "r_x2": 480.58871, "r_y2": 416.02774, "r_x3": 134.765, "r_y3": 416.02774, "coord_origin": "TOPLEFT" }, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 436.77969, "r_x1": 480.59265, "r_y1": 436.77969, "r_x2": 480.59265, "r_y2": 427.98273, "r_x3": 134.765, "r_y3": 427.98273, "coord_origin": "TOPLEFT" }, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 448.73467999999997, "r_x1": 187.93439, "r_y1": 448.73467999999997, "r_x2": 187.93439, "r_y2": 439.9377099999999, "r_x3": 134.765, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.931, "r_y0": 448.73467999999997, "r_x1": 211.60313, "r_y1": 448.73467999999997, "r_x2": 211.60313, "r_y2": 439.9377099999999, "r_x3": 187.931, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.75400000000002, "r_y0": 448.73467999999997, "r_x1": 230.80075000000002, "r_y1": 448.73467999999997, "r_x2": 230.80075000000002, "r_y2": 439.9377099999999, "r_x3": 214.75400000000002, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.83898999999997, "r_y0": 448.73467999999997, "r_x1": 262.60202, "r_y1": 448.73467999999997, "r_x2": 262.60202, "r_y2": 439.9377099999999, "r_x3": 233.83898999999997, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.716, "r_y0": 448.73467999999997, "r_x1": 480.59009, "r_y1": 448.73467999999997, "r_x2": 480.59009, "r_y2": 439.9377099999999, "r_x3": 262.716, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 460.68967, "r_x1": 480.58777, "r_y1": 460.68967, "r_x2": 480.58777, "r_y2": 451.8927, "r_x3": 134.76501, "r_y3": 451.8927, "coord_origin": "TOPLEFT" }, "text": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "orig": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 472.64465, "r_x1": 480.58681999999993, "r_y1": 472.64465, "r_x2": 480.58681999999993, "r_y2": 463.84769, "r_x3": 134.76501, "r_y3": 463.84769, "coord_origin": "TOPLEFT" }, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 484.60065, "r_x1": 480.58681999999993, "r_y1": 484.60065, "r_x2": 480.58681999999993, "r_y2": 475.80368, "r_x3": 134.76501, "r_y3": 475.80368, "coord_origin": "TOPLEFT" }, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 496.55563, "r_x1": 480.59067, "r_y1": 496.55563, "r_x2": 480.59067, "r_y2": 487.75867, "r_x3": 134.76501, "r_y3": 487.75867, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 508.51062, "r_x1": 480.59277, "r_y1": 508.51062, "r_x2": 480.59277, "r_y2": 499.71365, "r_x3": 134.76501, "r_y3": 499.71365, "coord_origin": "TOPLEFT" }, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 520.46561, "r_x1": 480.59476, "r_y1": 520.46561, "r_x2": 480.59476, "r_y2": 511.66864, "r_x3": 134.76501, "r_y3": 511.66864, "coord_origin": "TOPLEFT" }, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 532.42059, "r_x1": 176.92873, "r_y1": 532.42059, "r_x2": 176.92873, "r_y2": 523.62363, "r_x3": 134.76501, "r_y3": 523.62363, "coord_origin": "TOPLEFT" }, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 134.76501, "t": 536.04263, "r": 480.59289999999993, "b": 580.7056, "coord_origin": "TOPLEFT" }, "confidence": 0.978394627571106, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70901, "r_y0": 544.8396, "r_x1": 480.59289999999993, "r_y1": 544.8396, "r_x2": 480.59289999999993, "r_y2": 536.04263, "r_x3": 149.70901, "r_y3": 536.04263, "coord_origin": "TOPLEFT" }, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 556.7946000000001, "r_x1": 480.59085, "r_y1": 556.7946000000001, "r_x2": 480.59085, "r_y2": 547.99763, "r_x3": 134.76501, "r_y3": 547.99763, "coord_origin": "TOPLEFT" }, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 568.7496, "r_x1": 480.58984, "r_y1": 568.7496, "r_x2": 480.58984, "r_y2": 559.95264, "r_x3": 134.76501, "r_y3": 559.95264, "coord_origin": "TOPLEFT" }, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 580.7056, "r_x1": 452.18933, "r_y1": 580.7056, "r_x2": 452.18933, "r_y2": 571.90863, "r_x3": 134.76501, "r_y3": 571.90863, "coord_origin": "TOPLEFT" }, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.76501, "t": 584.32663, "r": 480.59473, "b": 664.85461, "coord_origin": "TOPLEFT" }, "confidence": 0.9838283061981201, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70901, "r_y0": 593.1236, "r_x1": 480.59283000000005, "r_y1": 593.1236, "r_x2": 480.59283000000005, "r_y2": 584.32663, "r_x3": 149.70901, "r_y3": 584.32663, "coord_origin": "TOPLEFT" }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 605.07959, "r_x1": 480.58978, "r_y1": 605.07959, "r_x2": 480.58978, "r_y2": 596.28262, "r_x3": 134.76501, "r_y3": 596.28262, "coord_origin": "TOPLEFT" }, "text": "cells, serialised in row-major ordering, where each row and each column have", "orig": "cells, serialised in row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 617.03459, "r_x1": 480.5936899999999, "r_y1": 617.03459, "r_x2": 480.5936899999999, "r_y2": 608.23763, "r_x3": 134.76501, "r_y3": 608.23763, "coord_origin": "TOPLEFT" }, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 628.98959, "r_x1": 480.59091, "r_y1": 628.98959, "r_x2": 480.59091, "r_y2": 620.19263, "r_x3": 134.76501, "r_y3": 620.19263, "coord_origin": "TOPLEFT" }, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 640.9446, "r_x1": 480.58582, "r_y1": 640.9446, "r_x2": 480.58582, "r_y2": 632.1476299999999, "r_x3": 134.76501, "r_y3": 632.1476299999999, "coord_origin": "TOPLEFT" }, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 652.8996, "r_x1": 480.59180000000003, "r_y1": 652.8996, "r_x2": 480.59180000000003, "r_y2": 644.10263, "r_x3": 134.76501, "r_y3": 644.10263, "coord_origin": "TOPLEFT" }, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 664.85461, "r_x1": 480.59473, "r_y1": 664.85461, "r_x2": 480.59473, "r_y2": 656.05763, "r_x3": 134.76501, "r_y3": 656.05763, "coord_origin": "TOPLEFT" }, "text": "it is complex to verify the consistency of predicted structures during sequence", "orig": "it is complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "picture", "bbox": { "l": 137.41448974609375, "t": 233.51231384277344, "r": 476.5608215332031, "b": 340.2304992675781, "coord_origin": "TOPLEFT" }, "confidence": 0.9387977123260498, "cells": [], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 5, "page_no": 4, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9269194602966309, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 6, "page_no": 4, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 475.98431, "t": 93.77099999999996, "r": 480.59125000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8696112036705017, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5" }, { "label": "text", "id": 0, "page_no": 4, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.59378, "b": 187.50684, "coord_origin": "TOPLEFT" }, "confidence": 0.9857171773910522, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.58577999999994, "r_y1": 127.73077, "r_x2": 480.58577999999994, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 162.48494, "r_y1": 139.68579, "r_x2": 162.48494, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.368, "r_y0": 139.68579, "r_x1": 201.74918, "r_y1": 139.68579, "r_x2": 201.74918, "r_y2": 130.88878999999997, "r_x3": 166.368, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.74899, "r_y0": 139.68579, "r_x1": 204.51561, "r_y1": 139.68579, "r_x2": 204.51561, "r_y2": 130.88878999999997, "r_x3": 201.74899, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.39699, "r_y0": 139.68579, "r_x1": 248.86904999999996, "r_y1": 139.68579, "r_x2": 248.86904999999996, "r_y2": 130.88878999999997, "r_x3": 208.39699, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.86899, "r_y0": 139.68579, "r_x1": 251.6356, "r_y1": 139.68579, "r_x2": 251.6356, "r_y2": 130.88878999999997, "r_x3": 248.86899, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.51698, "r_y0": 139.68579, "r_x1": 278.29846, "r_y1": 139.68579, "r_x2": 278.29846, "r_y2": 130.88878999999997, "r_x3": 255.51698, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.29797, "r_y0": 139.68579, "r_x1": 281.06458, "r_y1": 139.68579, "r_x2": 281.06458, "r_y2": 130.88878999999997, "r_x3": 278.29797, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.94598, "r_y0": 139.68579, "r_x1": 312.81836, "r_y1": 139.68579, "r_x2": 312.81836, "r_y2": 130.88878999999997, "r_x3": 284.94598, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.81799, "r_y0": 139.68579, "r_x1": 315.58459, "r_y1": 139.68579, "r_x2": 315.58459, "r_y2": 130.88878999999997, "r_x3": 312.81799, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 319.466, "r_y0": 139.68579, "r_x1": 343.13812, "r_y1": 139.68579, "r_x2": 343.13812, "r_y2": 130.88878999999997, "r_x3": 319.466, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.13202, "r_y0": 139.68579, "r_x1": 363.17877, "r_y1": 139.68579, "r_x2": 363.17877, "r_y2": 130.88878999999997, "r_x3": 347.13202, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06003, "r_y0": 139.68579, "r_x1": 395.82306, "r_y1": 139.68579, "r_x2": 395.82306, "r_y2": 130.88878999999997, "r_x3": 367.06003, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.82303, "r_y0": 139.68579, "r_x1": 480.59177000000005, "r_y1": 139.68579, "r_x2": 480.59177000000005, "r_y2": 130.88878999999997, "r_x3": 395.82303, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ", one can construct", "orig": ", one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 151.64178000000004, "r_x1": 480.59365999999994, "r_y1": 151.64178000000004, "r_x2": 480.59365999999994, "r_y2": 142.84479, "r_x3": 134.76501, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 163.59680000000003, "r_x1": 480.58577999999994, "r_y1": 163.59680000000003, "r_x2": 480.58577999999994, "r_y2": 154.7998, "r_x3": 134.76501, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 175.55182000000002, "r_x1": 480.59378, "r_y1": 175.55182000000002, "r_x2": 480.59378, "r_y2": 166.75482, "r_x3": 134.76501, "r_y3": 166.75482, "coord_origin": "TOPLEFT" }, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 187.50684, "r_x1": 261.92566, "r_y1": 187.50684, "r_x2": 261.92566, "r_y2": 178.70983999999999, "r_x3": 134.76501, "r_y3": 178.70983999999999, "coord_origin": "TOPLEFT" }, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML tokens ,
, , , and , one can construct simple table structures without any spanning cells. In reality though, one needs at least 28 HTML tokens to describe the most common complex tables observed in real-world documents [21,22], due to a variety of spanning cells definitions in the HTML token vocabulary." }, { "label": "caption", "id": 7, "page_no": 4, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 145.60701, "t": 221.07928000000004, "r": 469.75223000000005, "b": 229.21178999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.8472551703453064, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.60701, "r_y0": 229.00562000000002, "r_x1": 173.48625, "r_y1": 229.00562000000002, "r_x2": 173.48625, "r_y2": 221.07928000000004, "r_x3": 145.60701, "r_y3": 221.07928000000004, "coord_origin": "TOPLEFT" }, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56001, "r_y0": 229.21178999999995, "r_x1": 469.75223000000005, "r_y1": 229.21178999999995, "r_x2": 469.75223000000005, "r_y2": 221.14209000000005, "r_x3": 176.56001, "r_y3": 221.14209000000005, "coord_origin": "TOPLEFT" }, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 2. Frequency of tokens in HTML and OTSL as they appear in PubTabNet." }, { "label": "text", "id": 1, "page_no": 4, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 368.20679, "r": 480.59476, "b": 532.42059, "coord_origin": "TOPLEFT" }, "confidence": 0.9844799637794495, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 377.00375, "r_x1": 480.59283000000005, "r_y1": 377.00375, "r_x2": 480.59283000000005, "r_y2": 368.20679, "r_x3": 149.709, "r_y3": 368.20679, "coord_origin": "TOPLEFT" }, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 388.9587399999999, "r_x1": 480.58664, "r_y1": 388.9587399999999, "r_x2": 480.58664, "r_y2": 380.16177, "r_x3": 134.765, "r_y3": 380.16177, "coord_origin": "TOPLEFT" }, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 400.91373, "r_x1": 480.59180000000003, "r_y1": 400.91373, "r_x2": 480.59180000000003, "r_y2": 392.11676, "r_x3": 134.765, "r_y3": 392.11676, "coord_origin": "TOPLEFT" }, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 412.86871, "r_x1": 480.5897499999999, "r_y1": 412.86871, "r_x2": 480.5897499999999, "r_y2": 404.07175, "r_x3": 134.765, "r_y3": 404.07175, "coord_origin": "TOPLEFT" }, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 424.82471, "r_x1": 480.58871, "r_y1": 424.82471, "r_x2": 480.58871, "r_y2": 416.02774, "r_x3": 134.765, "r_y3": 416.02774, "coord_origin": "TOPLEFT" }, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 436.77969, "r_x1": 480.59265, "r_y1": 436.77969, "r_x2": 480.59265, "r_y2": 427.98273, "r_x3": 134.765, "r_y3": 427.98273, "coord_origin": "TOPLEFT" }, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 448.73467999999997, "r_x1": 187.93439, "r_y1": 448.73467999999997, "r_x2": 187.93439, "r_y2": 439.9377099999999, "r_x3": 134.765, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.931, "r_y0": 448.73467999999997, "r_x1": 211.60313, "r_y1": 448.73467999999997, "r_x2": 211.60313, "r_y2": 439.9377099999999, "r_x3": 187.931, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.75400000000002, "r_y0": 448.73467999999997, "r_x1": 230.80075000000002, "r_y1": 448.73467999999997, "r_x2": 230.80075000000002, "r_y2": 439.9377099999999, "r_x3": 214.75400000000002, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.83898999999997, "r_y0": 448.73467999999997, "r_x1": 262.60202, "r_y1": 448.73467999999997, "r_x2": 262.60202, "r_y2": 439.9377099999999, "r_x3": 233.83898999999997, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.716, "r_y0": 448.73467999999997, "r_x1": 480.59009, "r_y1": 448.73467999999997, "r_x2": 480.59009, "r_y2": 439.9377099999999, "r_x3": 262.716, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 460.68967, "r_x1": 480.58777, "r_y1": 460.68967, "r_x2": 480.58777, "r_y2": 451.8927, "r_x3": 134.76501, "r_y3": 451.8927, "coord_origin": "TOPLEFT" }, "text": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "orig": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 472.64465, "r_x1": 480.58681999999993, "r_y1": 472.64465, "r_x2": 480.58681999999993, "r_y2": 463.84769, "r_x3": 134.76501, "r_y3": 463.84769, "coord_origin": "TOPLEFT" }, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 484.60065, "r_x1": 480.58681999999993, "r_y1": 484.60065, "r_x2": 480.58681999999993, "r_y2": 475.80368, "r_x3": 134.76501, "r_y3": 475.80368, "coord_origin": "TOPLEFT" }, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 496.55563, "r_x1": 480.59067, "r_y1": 496.55563, "r_x2": 480.59067, "r_y2": 487.75867, "r_x3": 134.76501, "r_y3": 487.75867, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 508.51062, "r_x1": 480.59277, "r_y1": 508.51062, "r_x2": 480.59277, "r_y2": 499.71365, "r_x3": 134.76501, "r_y3": 499.71365, "coord_origin": "TOPLEFT" }, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 520.46561, "r_x1": 480.59476, "r_y1": 520.46561, "r_x2": 480.59476, "r_y2": 511.66864, "r_x3": 134.76501, "r_y3": 511.66864, "coord_origin": "TOPLEFT" }, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 532.42059, "r_x1": 176.92873, "r_y1": 532.42059, "r_x2": 176.92873, "r_y2": 523.62363, "r_x3": 134.76501, "r_y3": 523.62363, "coord_origin": "TOPLEFT" }, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Obviously, HTML and other general-purpose markup languages were not designed for Im2Seq models. As such, they have some serious drawbacks. First, the token vocabulary needs to be artificially large in order to describe all plausible tabular structures. Since most Im2Seq models use an autoregressive approach, they generate the sequence token by token. Therefore, to reduce inference time, a shorter sequence length is critical. Every table-cell is represented by at least two tokens ( and ). Furthermore, when tokenizing the HTML structure, one needs to explicitly enumerate possible column-spans and row-spans as words. In practice, this ends up requiring 28 different HTML tokens (when including column- and row-spans up to 10 cells) just to describe every table in the PubTabNet dataset. Clearly, not every token is equally represented, as is depicted in Figure 2. This skewed distribution of tokens in combination with variable token row-length makes it challenging for models to learn the HTML structure." }, { "label": "text", "id": 3, "page_no": 4, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.76501, "t": 536.04263, "r": 480.59289999999993, "b": 580.7056, "coord_origin": "TOPLEFT" }, "confidence": 0.978394627571106, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70901, "r_y0": 544.8396, "r_x1": 480.59289999999993, "r_y1": 544.8396, "r_x2": 480.59289999999993, "r_y2": 536.04263, "r_x3": 149.70901, "r_y3": 536.04263, "coord_origin": "TOPLEFT" }, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 556.7946000000001, "r_x1": 480.59085, "r_y1": 556.7946000000001, "r_x2": 480.59085, "r_y2": 547.99763, "r_x3": 134.76501, "r_y3": 547.99763, "coord_origin": "TOPLEFT" }, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 568.7496, "r_x1": 480.58984, "r_y1": 568.7496, "r_x2": 480.58984, "r_y2": 559.95264, "r_x3": 134.76501, "r_y3": 559.95264, "coord_origin": "TOPLEFT" }, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 580.7056, "r_x1": 452.18933, "r_y1": 580.7056, "r_x2": 452.18933, "r_y2": 571.90863, "r_x3": 134.76501, "r_y3": 571.90863, "coord_origin": "TOPLEFT" }, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Additionally, it would be desirable if the representation would easily allow an early detection of invalid sequences on-the-go, before the prediction of the entire table structure is completed. HTML is not well-suited for this purpose as the verification of incomplete sequences is non-trivial or even impossible." }, { "label": "text", "id": 2, "page_no": 4, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76501, "t": 584.32663, "r": 480.59473, "b": 664.85461, "coord_origin": "TOPLEFT" }, "confidence": 0.9838283061981201, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70901, "r_y0": 593.1236, "r_x1": 480.59283000000005, "r_y1": 593.1236, "r_x2": 480.59283000000005, "r_y2": 584.32663, "r_x3": 149.70901, "r_y3": 584.32663, "coord_origin": "TOPLEFT" }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 605.07959, "r_x1": 480.58978, "r_y1": 605.07959, "r_x2": 480.58978, "r_y2": 596.28262, "r_x3": 134.76501, "r_y3": 596.28262, "coord_origin": "TOPLEFT" }, "text": "cells, serialised in row-major ordering, where each row and each column have", "orig": "cells, serialised in row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 617.03459, "r_x1": 480.5936899999999, "r_y1": 617.03459, "r_x2": 480.5936899999999, "r_y2": 608.23763, "r_x3": 134.76501, "r_y3": 608.23763, "coord_origin": "TOPLEFT" }, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 628.98959, "r_x1": 480.59091, "r_y1": 628.98959, "r_x2": 480.59091, "r_y2": 620.19263, "r_x3": 134.76501, "r_y3": 620.19263, "coord_origin": "TOPLEFT" }, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 640.9446, "r_x1": 480.58582, "r_y1": 640.9446, "r_x2": 480.58582, "r_y2": 632.1476299999999, "r_x3": 134.76501, "r_y3": 632.1476299999999, "coord_origin": "TOPLEFT" }, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 652.8996, "r_x1": 480.59180000000003, "r_y1": 652.8996, "r_x2": 480.59180000000003, "r_y2": 644.10263, "r_x3": 134.76501, "r_y3": 644.10263, "coord_origin": "TOPLEFT" }, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 664.85461, "r_x1": 480.59473, "r_y1": 664.85461, "r_x2": 480.59473, "r_y2": 656.05763, "r_x3": 134.76501, "r_y3": 656.05763, "coord_origin": "TOPLEFT" }, "text": "it is complex to verify the consistency of predicted structures during sequence", "orig": "it is complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table cells, serialised in row-major ordering, where each row and each column have the same length (while considering row- and column-spans). Furthermore, every opening tag in HTML needs to be matched by a closing tag in a correct hierarchical manner. Since the number of tokens for each table row and column can vary significantly, especially for large tables with many row- and column-spans, it is complex to verify the consistency of predicted structures during sequence" }, { "label": "picture", "id": 4, "page_no": 4, "cluster": { "id": 4, "label": "picture", "bbox": { "l": 137.41448974609375, "t": 233.51231384277344, "r": 476.5608215332031, "b": 340.2304992675781, "coord_origin": "TOPLEFT" }, "confidence": 0.9387977123260498, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "body": [ { "label": "text", "id": 0, "page_no": 4, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.59378, "b": 187.50684, "coord_origin": "TOPLEFT" }, "confidence": 0.9857171773910522, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.58577999999994, "r_y1": 127.73077, "r_x2": 480.58577999999994, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 162.48494, "r_y1": 139.68579, "r_x2": 162.48494, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.368, "r_y0": 139.68579, "r_x1": 201.74918, "r_y1": 139.68579, "r_x2": 201.74918, "r_y2": 130.88878999999997, "r_x3": 166.368, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.74899, "r_y0": 139.68579, "r_x1": 204.51561, "r_y1": 139.68579, "r_x2": 204.51561, "r_y2": 130.88878999999997, "r_x3": 201.74899, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.39699, "r_y0": 139.68579, "r_x1": 248.86904999999996, "r_y1": 139.68579, "r_x2": 248.86904999999996, "r_y2": 130.88878999999997, "r_x3": 208.39699, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.86899, "r_y0": 139.68579, "r_x1": 251.6356, "r_y1": 139.68579, "r_x2": 251.6356, "r_y2": 130.88878999999997, "r_x3": 248.86899, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.51698, "r_y0": 139.68579, "r_x1": 278.29846, "r_y1": 139.68579, "r_x2": 278.29846, "r_y2": 130.88878999999997, "r_x3": 255.51698, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.29797, "r_y0": 139.68579, "r_x1": 281.06458, "r_y1": 139.68579, "r_x2": 281.06458, "r_y2": 130.88878999999997, "r_x3": 278.29797, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.94598, "r_y0": 139.68579, "r_x1": 312.81836, "r_y1": 139.68579, "r_x2": 312.81836, "r_y2": 130.88878999999997, "r_x3": 284.94598, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.81799, "r_y0": 139.68579, "r_x1": 315.58459, "r_y1": 139.68579, "r_x2": 315.58459, "r_y2": 130.88878999999997, "r_x3": 312.81799, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 319.466, "r_y0": 139.68579, "r_x1": 343.13812, "r_y1": 139.68579, "r_x2": 343.13812, "r_y2": 130.88878999999997, "r_x3": 319.466, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.13202, "r_y0": 139.68579, "r_x1": 363.17877, "r_y1": 139.68579, "r_x2": 363.17877, "r_y2": 130.88878999999997, "r_x3": 347.13202, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06003, "r_y0": 139.68579, "r_x1": 395.82306, "r_y1": 139.68579, "r_x2": 395.82306, "r_y2": 130.88878999999997, "r_x3": 367.06003, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.82303, "r_y0": 139.68579, "r_x1": 480.59177000000005, "r_y1": 139.68579, "r_x2": 480.59177000000005, "r_y2": 130.88878999999997, "r_x3": 395.82303, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": ", one can construct", "orig": ", one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 151.64178000000004, "r_x1": 480.59365999999994, "r_y1": 151.64178000000004, "r_x2": 480.59365999999994, "r_y2": 142.84479, "r_x3": 134.76501, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 163.59680000000003, "r_x1": 480.58577999999994, "r_y1": 163.59680000000003, "r_x2": 480.58577999999994, "r_y2": 154.7998, "r_x3": 134.76501, "r_y3": 154.7998, "coord_origin": "TOPLEFT" }, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 175.55182000000002, "r_x1": 480.59378, "r_y1": 175.55182000000002, "r_x2": 480.59378, "r_y2": 166.75482, "r_x3": 134.76501, "r_y3": 166.75482, "coord_origin": "TOPLEFT" }, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 187.50684, "r_x1": 261.92566, "r_y1": 187.50684, "r_x2": 261.92566, "r_y2": 178.70983999999999, "r_x3": 134.76501, "r_y3": 178.70983999999999, "coord_origin": "TOPLEFT" }, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML tokens ,
, , , and , one can construct simple table structures without any spanning cells. In reality though, one needs at least 28 HTML tokens to describe the most common complex tables observed in real-world documents [21,22], due to a variety of spanning cells definitions in the HTML token vocabulary." }, { "label": "caption", "id": 7, "page_no": 4, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 145.60701, "t": 221.07928000000004, "r": 469.75223000000005, "b": 229.21178999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.8472551703453064, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.60701, "r_y0": 229.00562000000002, "r_x1": 173.48625, "r_y1": 229.00562000000002, "r_x2": 173.48625, "r_y2": 221.07928000000004, "r_x3": 145.60701, "r_y3": 221.07928000000004, "coord_origin": "TOPLEFT" }, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56001, "r_y0": 229.21178999999995, "r_x1": 469.75223000000005, "r_y1": 229.21178999999995, "r_x2": 469.75223000000005, "r_y2": 221.14209000000005, "r_x3": 176.56001, "r_y3": 221.14209000000005, "coord_origin": "TOPLEFT" }, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 2. Frequency of tokens in HTML and OTSL as they appear in PubTabNet." }, { "label": "text", "id": 1, "page_no": 4, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 368.20679, "r": 480.59476, "b": 532.42059, "coord_origin": "TOPLEFT" }, "confidence": 0.9844799637794495, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 377.00375, "r_x1": 480.59283000000005, "r_y1": 377.00375, "r_x2": 480.59283000000005, "r_y2": 368.20679, "r_x3": 149.709, "r_y3": 368.20679, "coord_origin": "TOPLEFT" }, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 388.9587399999999, "r_x1": 480.58664, "r_y1": 388.9587399999999, "r_x2": 480.58664, "r_y2": 380.16177, "r_x3": 134.765, "r_y3": 380.16177, "coord_origin": "TOPLEFT" }, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 400.91373, "r_x1": 480.59180000000003, "r_y1": 400.91373, "r_x2": 480.59180000000003, "r_y2": 392.11676, "r_x3": 134.765, "r_y3": 392.11676, "coord_origin": "TOPLEFT" }, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 412.86871, "r_x1": 480.5897499999999, "r_y1": 412.86871, "r_x2": 480.5897499999999, "r_y2": 404.07175, "r_x3": 134.765, "r_y3": 404.07175, "coord_origin": "TOPLEFT" }, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 424.82471, "r_x1": 480.58871, "r_y1": 424.82471, "r_x2": 480.58871, "r_y2": 416.02774, "r_x3": 134.765, "r_y3": 416.02774, "coord_origin": "TOPLEFT" }, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 436.77969, "r_x1": 480.59265, "r_y1": 436.77969, "r_x2": 480.59265, "r_y2": 427.98273, "r_x3": 134.765, "r_y3": 427.98273, "coord_origin": "TOPLEFT" }, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 448.73467999999997, "r_x1": 187.93439, "r_y1": 448.73467999999997, "r_x2": 187.93439, "r_y2": 439.9377099999999, "r_x3": 134.765, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.931, "r_y0": 448.73467999999997, "r_x1": 211.60313, "r_y1": 448.73467999999997, "r_x2": 211.60313, "r_y2": 439.9377099999999, "r_x3": 187.931, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.75400000000002, "r_y0": 448.73467999999997, "r_x1": 230.80075000000002, "r_y1": 448.73467999999997, "r_x2": 230.80075000000002, "r_y2": 439.9377099999999, "r_x3": 214.75400000000002, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.83898999999997, "r_y0": 448.73467999999997, "r_x1": 262.60202, "r_y1": 448.73467999999997, "r_x2": 262.60202, "r_y2": 439.9377099999999, "r_x3": 233.83898999999997, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.716, "r_y0": 448.73467999999997, "r_x1": 480.59009, "r_y1": 448.73467999999997, "r_x2": 480.59009, "r_y2": 439.9377099999999, "r_x3": 262.716, "r_y3": 439.9377099999999, "coord_origin": "TOPLEFT" }, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 460.68967, "r_x1": 480.58777, "r_y1": 460.68967, "r_x2": 480.58777, "r_y2": 451.8927, "r_x3": 134.76501, "r_y3": 451.8927, "coord_origin": "TOPLEFT" }, "text": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "orig": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 472.64465, "r_x1": 480.58681999999993, "r_y1": 472.64465, "r_x2": 480.58681999999993, "r_y2": 463.84769, "r_x3": 134.76501, "r_y3": 463.84769, "coord_origin": "TOPLEFT" }, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 484.60065, "r_x1": 480.58681999999993, "r_y1": 484.60065, "r_x2": 480.58681999999993, "r_y2": 475.80368, "r_x3": 134.76501, "r_y3": 475.80368, "coord_origin": "TOPLEFT" }, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 496.55563, "r_x1": 480.59067, "r_y1": 496.55563, "r_x2": 480.59067, "r_y2": 487.75867, "r_x3": 134.76501, "r_y3": 487.75867, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 508.51062, "r_x1": 480.59277, "r_y1": 508.51062, "r_x2": 480.59277, "r_y2": 499.71365, "r_x3": 134.76501, "r_y3": 499.71365, "coord_origin": "TOPLEFT" }, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 520.46561, "r_x1": 480.59476, "r_y1": 520.46561, "r_x2": 480.59476, "r_y2": 511.66864, "r_x3": 134.76501, "r_y3": 511.66864, "coord_origin": "TOPLEFT" }, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 532.42059, "r_x1": 176.92873, "r_y1": 532.42059, "r_x2": 176.92873, "r_y2": 523.62363, "r_x3": 134.76501, "r_y3": 523.62363, "coord_origin": "TOPLEFT" }, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Obviously, HTML and other general-purpose markup languages were not designed for Im2Seq models. As such, they have some serious drawbacks. First, the token vocabulary needs to be artificially large in order to describe all plausible tabular structures. Since most Im2Seq models use an autoregressive approach, they generate the sequence token by token. Therefore, to reduce inference time, a shorter sequence length is critical. Every table-cell is represented by at least two tokens ( and ). Furthermore, when tokenizing the HTML structure, one needs to explicitly enumerate possible column-spans and row-spans as words. In practice, this ends up requiring 28 different HTML tokens (when including column- and row-spans up to 10 cells) just to describe every table in the PubTabNet dataset. Clearly, not every token is equally represented, as is depicted in Figure 2. This skewed distribution of tokens in combination with variable token row-length makes it challenging for models to learn the HTML structure." }, { "label": "text", "id": 3, "page_no": 4, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.76501, "t": 536.04263, "r": 480.59289999999993, "b": 580.7056, "coord_origin": "TOPLEFT" }, "confidence": 0.978394627571106, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70901, "r_y0": 544.8396, "r_x1": 480.59289999999993, "r_y1": 544.8396, "r_x2": 480.59289999999993, "r_y2": 536.04263, "r_x3": 149.70901, "r_y3": 536.04263, "coord_origin": "TOPLEFT" }, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 556.7946000000001, "r_x1": 480.59085, "r_y1": 556.7946000000001, "r_x2": 480.59085, "r_y2": 547.99763, "r_x3": 134.76501, "r_y3": 547.99763, "coord_origin": "TOPLEFT" }, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 568.7496, "r_x1": 480.58984, "r_y1": 568.7496, "r_x2": 480.58984, "r_y2": 559.95264, "r_x3": 134.76501, "r_y3": 559.95264, "coord_origin": "TOPLEFT" }, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 580.7056, "r_x1": 452.18933, "r_y1": 580.7056, "r_x2": 452.18933, "r_y2": 571.90863, "r_x3": 134.76501, "r_y3": 571.90863, "coord_origin": "TOPLEFT" }, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Additionally, it would be desirable if the representation would easily allow an early detection of invalid sequences on-the-go, before the prediction of the entire table structure is completed. HTML is not well-suited for this purpose as the verification of incomplete sequences is non-trivial or even impossible." }, { "label": "text", "id": 2, "page_no": 4, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76501, "t": 584.32663, "r": 480.59473, "b": 664.85461, "coord_origin": "TOPLEFT" }, "confidence": 0.9838283061981201, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70901, "r_y0": 593.1236, "r_x1": 480.59283000000005, "r_y1": 593.1236, "r_x2": 480.59283000000005, "r_y2": 584.32663, "r_x3": 149.70901, "r_y3": 584.32663, "coord_origin": "TOPLEFT" }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 605.07959, "r_x1": 480.58978, "r_y1": 605.07959, "r_x2": 480.58978, "r_y2": 596.28262, "r_x3": 134.76501, "r_y3": 596.28262, "coord_origin": "TOPLEFT" }, "text": "cells, serialised in row-major ordering, where each row and each column have", "orig": "cells, serialised in row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 617.03459, "r_x1": 480.5936899999999, "r_y1": 617.03459, "r_x2": 480.5936899999999, "r_y2": 608.23763, "r_x3": 134.76501, "r_y3": 608.23763, "coord_origin": "TOPLEFT" }, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 628.98959, "r_x1": 480.59091, "r_y1": 628.98959, "r_x2": 480.59091, "r_y2": 620.19263, "r_x3": 134.76501, "r_y3": 620.19263, "coord_origin": "TOPLEFT" }, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 640.9446, "r_x1": 480.58582, "r_y1": 640.9446, "r_x2": 480.58582, "r_y2": 632.1476299999999, "r_x3": 134.76501, "r_y3": 632.1476299999999, "coord_origin": "TOPLEFT" }, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 652.8996, "r_x1": 480.59180000000003, "r_y1": 652.8996, "r_x2": 480.59180000000003, "r_y2": 644.10263, "r_x3": 134.76501, "r_y3": 644.10263, "coord_origin": "TOPLEFT" }, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 664.85461, "r_x1": 480.59473, "r_y1": 664.85461, "r_x2": 480.59473, "r_y2": 656.05763, "r_x3": 134.76501, "r_y3": 656.05763, "coord_origin": "TOPLEFT" }, "text": "it is complex to verify the consistency of predicted structures during sequence", "orig": "it is complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table cells, serialised in row-major ordering, where each row and each column have the same length (while considering row- and column-spans). Furthermore, every opening tag in HTML needs to be matched by a closing tag in a correct hierarchical manner. Since the number of tokens for each table row and column can vary significantly, especially for large tables with many row- and column-spans, it is complex to verify the consistency of predicted structures during sequence" }, { "label": "picture", "id": 4, "page_no": 4, "cluster": { "id": 4, "label": "picture", "bbox": { "l": 137.41448974609375, "t": 233.51231384277344, "r": 476.5608215332031, "b": 340.2304992675781, "coord_origin": "TOPLEFT" }, "confidence": 0.9387977123260498, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "headers": [ { "label": "page_header", "id": 5, "page_no": 4, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9269194602966309, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 6, "page_no": 4, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 475.98431, "t": 93.77099999999996, "r": 480.59125000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8696112036705017, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5" } ] } }, { "page_no": 5, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.59479, "r_y1": 127.73077, "r_x2": 480.59479, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 364.62503, "r_y1": 139.68579, "r_x2": 364.62503, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 152.27979000000005, "r_x1": 480.58981, "r_y1": 152.27979000000005, "r_x2": 480.58981, "r_y2": 143.48279000000002, "r_x3": 149.709, "r_y3": 143.48279000000002, "coord_origin": "TOPLEFT" }, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 164.23479999999995, "r_x1": 480.59378, "r_y1": 164.23479999999995, "r_x2": 480.59378, "r_y2": 155.43781, "r_x3": 134.765, "r_y3": 155.43781, "coord_origin": "TOPLEFT" }, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 176.18982000000005, "r_x1": 480.5867, "r_y1": 176.18982000000005, "r_x2": 480.5867, "r_y2": 167.39282000000003, "r_x3": 134.765, "r_y3": 167.39282000000003, "coord_origin": "TOPLEFT" }, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 188.14484000000004, "r_x1": 480.59476, "r_y1": 188.14484000000004, "r_x2": 480.59476, "r_y2": 179.34784000000002, "r_x3": 134.765, "r_y3": 179.34784000000002, "coord_origin": "TOPLEFT" }, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 200.09984999999995, "r_x1": 314.27805, "r_y1": 200.09984999999995, "r_x2": 314.27805, "r_y2": 191.30286, "r_x3": 134.765, "r_y3": 191.30286, "coord_origin": "TOPLEFT" }, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.056, "r_y0": 200.09984999999995, "r_x1": 374.08664, "r_y1": 200.09984999999995, "r_x2": 374.08664, "r_y2": 191.30286, "r_x3": 318.056, "r_y3": 191.30286, "coord_origin": "TOPLEFT" }, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 378.80899, "r_y0": 200.09984999999995, "r_x1": 480.58594, "r_y1": 200.09984999999995, "r_x2": 480.58594, "r_y2": 191.30286, "r_x3": 378.80899, "r_y3": 191.30286, "coord_origin": "TOPLEFT" }, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 212.05584999999996, "r_x1": 480.58771, "r_y1": 212.05584999999996, "r_x2": 480.58771, "r_y2": 203.25885000000005, "r_x3": 134.76498, "r_y3": 203.25885000000005, "coord_origin": "TOPLEFT" }, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 224.01085999999998, "r_x1": 480.59569999999997, "r_y1": 224.01085999999998, "r_x2": 480.59569999999997, "r_y2": 215.21387000000004, "r_x3": 134.76498, "r_y3": 215.21387000000004, "coord_origin": "TOPLEFT" }, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 235.96587999999997, "r_x1": 480.59454, "r_y1": 235.96587999999997, "r_x2": 480.59454, "r_y2": 227.16887999999994, "r_x3": 134.76498, "r_y3": 227.16887999999994, "coord_origin": "TOPLEFT" }, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 247.92089999999996, "r_x1": 480.58759000000003, "r_y1": 247.92089999999996, "r_x2": 480.58759000000003, "r_y2": 239.12390000000005, "r_x3": 134.76498, "r_y3": 239.12390000000005, "coord_origin": "TOPLEFT" }, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 259.87591999999995, "r_x1": 480.59277, "r_y1": 259.87591999999995, "r_x2": 480.59277, "r_y2": 251.07892000000004, "r_x3": 134.76498, "r_y3": 251.07892000000004, "coord_origin": "TOPLEFT" }, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 271.83092999999997, "r_x1": 480.59463999999997, "r_y1": 271.83092999999997, "r_x2": 480.59463999999997, "r_y2": 263.03394000000003, "r_x3": 134.76498, "r_y3": 263.03394000000003, "coord_origin": "TOPLEFT" }, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 283.78693, "r_x1": 480.58978, "r_y1": 283.78693, "r_x2": 480.58978, "r_y2": 274.98992999999996, "r_x3": 134.76498, "r_y3": 274.98992999999996, "coord_origin": "TOPLEFT" }, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 295.74191, "r_x1": 223.57262, "r_y1": 295.74191, "r_x2": 223.57262, "r_y2": 286.94495, "r_x3": 134.76498, "r_y3": 286.94495, "coord_origin": "TOPLEFT" }, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 331.19949, "r_x1": 141.48859, "r_y1": 331.19949, "r_x2": 141.48859, "r_y2": 320.6311, "r_x3": 134.76498, "r_y3": 320.6311, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93819, "r_y0": 331.19949, "r_x1": 372.50848, "r_y1": 331.19949, "r_x2": 372.50848, "r_y2": 320.6311, "r_x3": 154.93819, "r_y3": 320.6311, "coord_origin": "TOPLEFT" }, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 357.91394, "r_x1": 480.59075999999993, "r_y1": 357.91394, "r_x2": 480.59075999999993, "r_y2": 349.11697, "r_x3": 134.76498, "r_y3": 349.11697, "coord_origin": "TOPLEFT" }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 369.86893, "r_x1": 480.58875, "r_y1": 369.86893, "r_x2": 480.58875, "r_y2": 361.07196000000005, "r_x3": 134.76498, "r_y3": 361.07196000000005, "coord_origin": "TOPLEFT" }, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 381.82492, "r_x1": 480.58681999999993, "r_y1": 381.82492, "r_x2": 480.58681999999993, "r_y2": 373.02795, "r_x3": 134.76498, "r_y3": 373.02795, "coord_origin": "TOPLEFT" }, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 393.77991, "r_x1": 480.58875, "r_y1": 393.77991, "r_x2": 480.58875, "r_y2": 384.98294, "r_x3": 134.76498, "r_y3": 384.98294, "coord_origin": "TOPLEFT" }, "text": "set of rules, which are both significantly reduced compared to HTML. At the", "orig": "set of rules, which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 405.73489, "r_x1": 480.58978, "r_y1": 405.73489, "r_x2": 480.58978, "r_y2": 396.93793, "r_x3": 134.76498, "r_y3": 396.93793, "coord_origin": "TOPLEFT" }, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 417.68988, "r_x1": 480.59473, "r_y1": 417.68988, "r_x2": 480.59473, "r_y2": 408.89291, "r_x3": 134.76498, "r_y3": 408.89291, "coord_origin": "TOPLEFT" }, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 429.64487, "r_x1": 480.58868, "r_y1": 429.64487, "r_x2": 480.58868, "r_y2": 420.8479, "r_x3": 134.76498, "r_y3": 420.8479, "coord_origin": "TOPLEFT" }, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 441.59985, "r_x1": 276.67325, "r_y1": 441.59985, "r_x2": 276.67325, "r_y2": 432.80289, "r_x3": 134.76498, "r_y3": 432.80289, "coord_origin": "TOPLEFT" }, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 474.67886, "r_x1": 149.40204, "r_y1": 474.67886, "r_x2": 149.40204, "r_y2": 465.87192, "r_x3": 134.76498, "r_y3": 465.87192, "coord_origin": "TOPLEFT" }, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85902, "r_y0": 474.67886, "r_x1": 261.80109, "r_y1": 474.67886, "r_x2": 261.80109, "r_y2": 465.87192, "r_x3": 160.85902, "r_y3": 465.87192, "coord_origin": "TOPLEFT" }, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 497.79486, "r_x1": 480.58871, "r_y1": 497.79486, "r_x2": 480.58871, "r_y2": 488.99789, "r_x3": 134.76498, "r_y3": 488.99789, "coord_origin": "TOPLEFT" }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 509.74985, "r_x1": 480.5867, "r_y1": 509.74985, "r_x2": 480.5867, "r_y2": 500.95288, "r_x3": 134.76498, "r_y3": 500.95288, "coord_origin": "TOPLEFT" }, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 521.7058400000001, "r_x1": 154.7131, "r_y1": 521.7058400000001, "r_x2": 154.7131, "r_y2": 512.90887, "r_x3": 134.76498, "r_y3": 512.90887, "coord_origin": "TOPLEFT" }, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 534.29883, "r_x1": 409.31137, "r_y1": 534.29883, "r_x2": 409.31137, "r_y2": 525.5018600000001, "r_x3": 149.70898, "r_y3": 525.5018600000001, "coord_origin": "TOPLEFT" }, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99298, "r_y0": 556.77682, "r_x1": 146.72047, "r_y1": 556.77682, "r_x2": 146.72047, "r_y2": 547.96989, "r_x3": 140.99298, "r_y3": 547.96989, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 556.77682, "r_x1": 193.20619, "r_y1": 556.77682, "r_x2": 193.20619, "r_y2": 547.97986, "r_x3": 151.70099, "r_y3": 547.97986, "coord_origin": "TOPLEFT" }, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.52199, "r_y0": 556.77682, "r_x1": 263.46564, "r_y1": 556.77682, "r_x2": 263.46564, "r_y2": 547.97986, "r_x3": 196.52199, "r_y3": 547.97986, "coord_origin": "TOPLEFT" }, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.815, "r_y0": 556.77682, "r_x1": 460.54443, "r_y1": 556.77682, "r_x2": 460.54443, "r_y2": 547.97986, "r_x3": 267.815, "r_y3": 547.97986, "coord_origin": "TOPLEFT" }, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99301, "r_y0": 569.36983, "r_x1": 146.7205, "r_y1": 569.36983, "r_x2": 146.7205, "r_y2": 560.5629, "r_x3": 140.99301, "r_y3": 560.5629, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70102, "r_y0": 569.36983, "r_x1": 194.30011, "r_y1": 569.36983, "r_x2": 194.30011, "r_y2": 560.57286, "r_x3": 151.70102, "r_y3": 560.57286, "coord_origin": "TOPLEFT" }, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.65903, "r_y0": 569.36983, "r_x1": 264.51779, "r_y1": 569.36983, "r_x2": 264.51779, "r_y2": 560.57286, "r_x3": 198.65903, "r_y3": 560.57286, "coord_origin": "TOPLEFT" }, "text": "left-looking cell", "orig": "left-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.51804, "r_y0": 569.36983, "r_x1": 480.59392999999994, "r_y1": 569.36983, "r_x2": 480.59392999999994, "r_y2": 560.57286, "r_x3": 264.51804, "r_y3": 560.57286, "coord_origin": "TOPLEFT" }, "text": ", merging with the left neighbor cell to create a", "orig": ", merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70103, "r_y0": 581.32483, "r_x1": 171.67604, "r_y1": 581.32483, "r_x2": 171.67604, "r_y2": 572.52786, "r_x3": 151.70103, "r_y3": 572.52786, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99304, "r_y0": 593.91882, "r_x1": 146.72054, "r_y1": 593.91882, "r_x2": 146.72054, "r_y2": 585.11189, "r_x3": 140.99304, "r_y3": 585.11189, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 593.91882, "r_x1": 194.11086, "r_y1": 593.91882, "r_x2": 194.11086, "r_y2": 585.12186, "r_x3": 151.70105, "r_y3": 585.12186, "coord_origin": "TOPLEFT" }, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 197.74805, "r_y0": 593.91882, "r_x1": 259.89474, "r_y1": 593.91882, "r_x2": 259.89474, "r_y2": 585.12186, "r_x3": 197.74805, "r_y3": 585.12186, "coord_origin": "TOPLEFT" }, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.89206, "r_y0": 593.91882, "r_x1": 480.58856, "r_y1": 593.91882, "r_x2": 480.58856, "r_y2": 585.12186, "r_x3": 259.89206, "r_y3": 585.12186, "coord_origin": "TOPLEFT" }, "text": ", merging with the upper neighbor cell to create a", "orig": ", merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 605.87383, "r_x1": 171.67606, "r_y1": 605.87383, "r_x2": 171.67606, "r_y2": 597.07686, "r_x3": 151.70105, "r_y3": 597.07686, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99304, "r_y0": 618.46683, "r_x1": 146.72054, "r_y1": 618.46683, "r_x2": 146.72054, "r_y2": 609.6599, "r_x3": 140.99304, "r_y3": 609.6599, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 618.46683, "r_x1": 193.48323, "r_y1": 618.46683, "r_x2": 193.48323, "r_y2": 609.66986, "r_x3": 151.70105, "r_y3": 609.66986, "coord_origin": "TOPLEFT" }, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.79904, "r_y0": 618.46683, "r_x1": 236.12042, "r_y1": 618.46683, "r_x2": 236.12042, "r_y2": 609.66986, "r_x3": 196.79904, "r_y3": 609.66986, "coord_origin": "TOPLEFT" }, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.12505, "r_y0": 618.46683, "r_x1": 454.55496, "r_y1": 618.46683, "r_x2": 454.55496, "r_y2": 609.66986, "r_x3": 236.12505, "r_y3": 609.66986, "coord_origin": "TOPLEFT" }, "text": ", to merge with both left and upper neighbor cells", "orig": ", to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99304, "r_y0": 631.06082, "r_x1": 146.72054, "r_y1": 631.06082, "r_x2": 146.72054, "r_y2": 622.2538900000001, "r_x3": 140.99304, "r_y3": 622.2538900000001, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 631.06082, "r_x1": 181.99434, "r_y1": 631.06082, "r_x2": 181.99434, "r_y2": 622.26385, "r_x3": 151.70105, "r_y3": 622.26385, "coord_origin": "TOPLEFT" }, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.31705, "r_y0": 631.06082, "r_x1": 221.46236, "r_y1": 631.06082, "r_x2": 221.46236, "r_y2": 622.26385, "r_x3": 185.31705, "r_y3": 622.26385, "coord_origin": "TOPLEFT" }, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46104, "r_y0": 631.06082, "r_x1": 328.61676, "r_y1": 631.06082, "r_x2": 328.61676, "r_y2": 622.26385, "r_x3": 221.46104, "r_y3": 622.26385, "coord_origin": "TOPLEFT" }, "text": ", switch to the next row.", "orig": ", switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70905, "r_y0": 652.8998300000001, "r_x1": 480.59280000000007, "r_y1": 652.8998300000001, "r_x2": 480.59280000000007, "r_y2": 644.10286, "r_x3": 149.70905, "r_y3": 644.10286, "coord_origin": "TOPLEFT" }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76505, "r_y0": 664.85484, "r_x1": 228.22321, "r_y1": 664.85484, "r_x2": 228.22321, "r_y2": 656.05786, "r_x3": 134.76505, "r_y3": 656.05786, "coord_origin": "TOPLEFT" }, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 14, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 139.37193, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8378868699073792, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "page_header", "bbox": { "l": 167.81335, "t": 93.77099999999996, "r": 231.72227, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8919177651405334, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.59479, "b": 139.68579, "coord_origin": "TOPLEFT" }, "confidence": 0.9633480906486511, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.59479, "r_y1": 127.73077, "r_x2": 480.59479, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 364.62503, "r_y1": 139.68579, "r_x2": 364.62503, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.76498, "t": 143.48279000000002, "r": 480.59569999999997, "b": 295.74191, "coord_origin": "TOPLEFT" }, "confidence": 0.9856827855110168, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 152.27979000000005, "r_x1": 480.58981, "r_y1": 152.27979000000005, "r_x2": 480.58981, "r_y2": 143.48279000000002, "r_x3": 149.709, "r_y3": 143.48279000000002, "coord_origin": "TOPLEFT" }, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 164.23479999999995, "r_x1": 480.59378, "r_y1": 164.23479999999995, "r_x2": 480.59378, "r_y2": 155.43781, "r_x3": 134.765, "r_y3": 155.43781, "coord_origin": "TOPLEFT" }, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 176.18982000000005, "r_x1": 480.5867, "r_y1": 176.18982000000005, "r_x2": 480.5867, "r_y2": 167.39282000000003, "r_x3": 134.765, "r_y3": 167.39282000000003, "coord_origin": "TOPLEFT" }, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 188.14484000000004, "r_x1": 480.59476, "r_y1": 188.14484000000004, "r_x2": 480.59476, "r_y2": 179.34784000000002, "r_x3": 134.765, "r_y3": 179.34784000000002, "coord_origin": "TOPLEFT" }, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 200.09984999999995, "r_x1": 314.27805, "r_y1": 200.09984999999995, "r_x2": 314.27805, "r_y2": 191.30286, "r_x3": 134.765, "r_y3": 191.30286, "coord_origin": "TOPLEFT" }, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.056, "r_y0": 200.09984999999995, "r_x1": 374.08664, "r_y1": 200.09984999999995, "r_x2": 374.08664, "r_y2": 191.30286, "r_x3": 318.056, "r_y3": 191.30286, "coord_origin": "TOPLEFT" }, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 378.80899, "r_y0": 200.09984999999995, "r_x1": 480.58594, "r_y1": 200.09984999999995, "r_x2": 480.58594, "r_y2": 191.30286, "r_x3": 378.80899, "r_y3": 191.30286, "coord_origin": "TOPLEFT" }, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 212.05584999999996, "r_x1": 480.58771, "r_y1": 212.05584999999996, "r_x2": 480.58771, "r_y2": 203.25885000000005, "r_x3": 134.76498, "r_y3": 203.25885000000005, "coord_origin": "TOPLEFT" }, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 224.01085999999998, "r_x1": 480.59569999999997, "r_y1": 224.01085999999998, "r_x2": 480.59569999999997, "r_y2": 215.21387000000004, "r_x3": 134.76498, "r_y3": 215.21387000000004, "coord_origin": "TOPLEFT" }, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 235.96587999999997, "r_x1": 480.59454, "r_y1": 235.96587999999997, "r_x2": 480.59454, "r_y2": 227.16887999999994, "r_x3": 134.76498, "r_y3": 227.16887999999994, "coord_origin": "TOPLEFT" }, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 247.92089999999996, "r_x1": 480.58759000000003, "r_y1": 247.92089999999996, "r_x2": 480.58759000000003, "r_y2": 239.12390000000005, "r_x3": 134.76498, "r_y3": 239.12390000000005, "coord_origin": "TOPLEFT" }, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 259.87591999999995, "r_x1": 480.59277, "r_y1": 259.87591999999995, "r_x2": 480.59277, "r_y2": 251.07892000000004, "r_x3": 134.76498, "r_y3": 251.07892000000004, "coord_origin": "TOPLEFT" }, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 271.83092999999997, "r_x1": 480.59463999999997, "r_y1": 271.83092999999997, "r_x2": 480.59463999999997, "r_y2": 263.03394000000003, "r_x3": 134.76498, "r_y3": 263.03394000000003, "coord_origin": "TOPLEFT" }, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 283.78693, "r_x1": 480.58978, "r_y1": 283.78693, "r_x2": 480.58978, "r_y2": 274.98992999999996, "r_x3": 134.76498, "r_y3": 274.98992999999996, "coord_origin": "TOPLEFT" }, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 295.74191, "r_x1": 223.57262, "r_y1": 295.74191, "r_x2": 223.57262, "r_y2": 286.94495, "r_x3": 134.76498, "r_y3": 286.94495, "coord_origin": "TOPLEFT" }, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "section_header", "bbox": { "l": 134.76498, "t": 320.6311, "r": 372.50848, "b": 331.19949, "coord_origin": "TOPLEFT" }, "confidence": 0.957028865814209, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 331.19949, "r_x1": 141.48859, "r_y1": 331.19949, "r_x2": 141.48859, "r_y2": 320.6311, "r_x3": 134.76498, "r_y3": 320.6311, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93819, "r_y0": 331.19949, "r_x1": 372.50848, "r_y1": 331.19949, "r_x2": 372.50848, "r_y2": 320.6311, "r_x3": 154.93819, "r_y3": 320.6311, "coord_origin": "TOPLEFT" }, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.76498, "t": 349.11697, "r": 480.59473, "b": 441.59985, "coord_origin": "TOPLEFT" }, "confidence": 0.9879323840141296, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 357.91394, "r_x1": 480.59075999999993, "r_y1": 357.91394, "r_x2": 480.59075999999993, "r_y2": 349.11697, "r_x3": 134.76498, "r_y3": 349.11697, "coord_origin": "TOPLEFT" }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 369.86893, "r_x1": 480.58875, "r_y1": 369.86893, "r_x2": 480.58875, "r_y2": 361.07196000000005, "r_x3": 134.76498, "r_y3": 361.07196000000005, "coord_origin": "TOPLEFT" }, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 381.82492, "r_x1": 480.58681999999993, "r_y1": 381.82492, "r_x2": 480.58681999999993, "r_y2": 373.02795, "r_x3": 134.76498, "r_y3": 373.02795, "coord_origin": "TOPLEFT" }, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 393.77991, "r_x1": 480.58875, "r_y1": 393.77991, "r_x2": 480.58875, "r_y2": 384.98294, "r_x3": 134.76498, "r_y3": 384.98294, "coord_origin": "TOPLEFT" }, "text": "set of rules, which are both significantly reduced compared to HTML. At the", "orig": "set of rules, which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 405.73489, "r_x1": 480.58978, "r_y1": 405.73489, "r_x2": 480.58978, "r_y2": 396.93793, "r_x3": 134.76498, "r_y3": 396.93793, "coord_origin": "TOPLEFT" }, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 417.68988, "r_x1": 480.59473, "r_y1": 417.68988, "r_x2": 480.59473, "r_y2": 408.89291, "r_x3": 134.76498, "r_y3": 408.89291, "coord_origin": "TOPLEFT" }, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 429.64487, "r_x1": 480.58868, "r_y1": 429.64487, "r_x2": 480.58868, "r_y2": 420.8479, "r_x3": 134.76498, "r_y3": 420.8479, "coord_origin": "TOPLEFT" }, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 441.59985, "r_x1": 276.67325, "r_y1": 441.59985, "r_x2": 276.67325, "r_y2": 432.80289, "r_x3": 134.76498, "r_y3": 432.80289, "coord_origin": "TOPLEFT" }, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "section_header", "bbox": { "l": 134.76498, "t": 465.87192, "r": 261.80109, "b": 474.67886, "coord_origin": "TOPLEFT" }, "confidence": 0.9559652209281921, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 474.67886, "r_x1": 149.40204, "r_y1": 474.67886, "r_x2": 149.40204, "r_y2": 465.87192, "r_x3": 134.76498, "r_y3": 465.87192, "coord_origin": "TOPLEFT" }, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85902, "r_y0": 474.67886, "r_x1": 261.80109, "r_y1": 474.67886, "r_x2": 261.80109, "r_y2": 465.87192, "r_x3": 160.85902, "r_y3": 465.87192, "coord_origin": "TOPLEFT" }, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.76498, "t": 488.99789, "r": 480.58871, "b": 521.7058400000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9671263098716736, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 497.79486, "r_x1": 480.58871, "r_y1": 497.79486, "r_x2": 480.58871, "r_y2": 488.99789, "r_x3": 134.76498, "r_y3": 488.99789, "coord_origin": "TOPLEFT" }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 509.74985, "r_x1": 480.5867, "r_y1": 509.74985, "r_x2": 480.5867, "r_y2": 500.95288, "r_x3": 134.76498, "r_y3": 500.95288, "coord_origin": "TOPLEFT" }, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 521.7058400000001, "r_x1": 154.7131, "r_y1": 521.7058400000001, "r_x2": 154.7131, "r_y2": 512.90887, "r_x3": 134.76498, "r_y3": 512.90887, "coord_origin": "TOPLEFT" }, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 149.70898, "t": 525.5018600000001, "r": 409.31137, "b": 534.29883, "coord_origin": "TOPLEFT" }, "confidence": 0.8555866479873657, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 534.29883, "r_x1": 409.31137, "r_y1": 534.29883, "r_x2": 409.31137, "r_y2": 525.5018600000001, "r_x3": 149.70898, "r_y3": 525.5018600000001, "coord_origin": "TOPLEFT" }, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 140.99298, "t": 547.96989, "r": 460.54443, "b": 556.77682, "coord_origin": "TOPLEFT" }, "confidence": 0.9184334874153137, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99298, "r_y0": 556.77682, "r_x1": 146.72047, "r_y1": 556.77682, "r_x2": 146.72047, "r_y2": 547.96989, "r_x3": 140.99298, "r_y3": 547.96989, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 556.77682, "r_x1": 193.20619, "r_y1": 556.77682, "r_x2": 193.20619, "r_y2": 547.97986, "r_x3": 151.70099, "r_y3": 547.97986, "coord_origin": "TOPLEFT" }, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.52199, "r_y0": 556.77682, "r_x1": 263.46564, "r_y1": 556.77682, "r_x2": 263.46564, "r_y2": 547.97986, "r_x3": 196.52199, "r_y3": 547.97986, "coord_origin": "TOPLEFT" }, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.815, "r_y0": 556.77682, "r_x1": 460.54443, "r_y1": 556.77682, "r_x2": 460.54443, "r_y2": 547.97986, "r_x3": 267.815, "r_y3": 547.97986, "coord_origin": "TOPLEFT" }, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 140.99301, "t": 560.5629, "r": 480.59392999999994, "b": 581.32483, "coord_origin": "TOPLEFT" }, "confidence": 0.9319931268692017, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99301, "r_y0": 569.36983, "r_x1": 146.7205, "r_y1": 569.36983, "r_x2": 146.7205, "r_y2": 560.5629, "r_x3": 140.99301, "r_y3": 560.5629, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70102, "r_y0": 569.36983, "r_x1": 194.30011, "r_y1": 569.36983, "r_x2": 194.30011, "r_y2": 560.57286, "r_x3": 151.70102, "r_y3": 560.57286, "coord_origin": "TOPLEFT" }, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.65903, "r_y0": 569.36983, "r_x1": 264.51779, "r_y1": 569.36983, "r_x2": 264.51779, "r_y2": 560.57286, "r_x3": 198.65903, "r_y3": 560.57286, "coord_origin": "TOPLEFT" }, "text": "left-looking cell", "orig": "left-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.51804, "r_y0": 569.36983, "r_x1": 480.59392999999994, "r_y1": 569.36983, "r_x2": 480.59392999999994, "r_y2": 560.57286, "r_x3": 264.51804, "r_y3": 560.57286, "coord_origin": "TOPLEFT" }, "text": ", merging with the left neighbor cell to create a", "orig": ", merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70103, "r_y0": 581.32483, "r_x1": 171.67604, "r_y1": 581.32483, "r_x2": 171.67604, "r_y2": 572.52786, "r_x3": 151.70103, "r_y3": 572.52786, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "list_item", "bbox": { "l": 140.99304, "t": 585.11189, "r": 480.58856, "b": 605.87383, "coord_origin": "TOPLEFT" }, "confidence": 0.9438967704772949, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99304, "r_y0": 593.91882, "r_x1": 146.72054, "r_y1": 593.91882, "r_x2": 146.72054, "r_y2": 585.11189, "r_x3": 140.99304, "r_y3": 585.11189, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 593.91882, "r_x1": 194.11086, "r_y1": 593.91882, "r_x2": 194.11086, "r_y2": 585.12186, "r_x3": 151.70105, "r_y3": 585.12186, "coord_origin": "TOPLEFT" }, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 197.74805, "r_y0": 593.91882, "r_x1": 259.89474, "r_y1": 593.91882, "r_x2": 259.89474, "r_y2": 585.12186, "r_x3": 197.74805, "r_y3": 585.12186, "coord_origin": "TOPLEFT" }, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.89206, "r_y0": 593.91882, "r_x1": 480.58856, "r_y1": 593.91882, "r_x2": 480.58856, "r_y2": 585.12186, "r_x3": 259.89206, "r_y3": 585.12186, "coord_origin": "TOPLEFT" }, "text": ", merging with the upper neighbor cell to create a", "orig": ", merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 605.87383, "r_x1": 171.67606, "r_y1": 605.87383, "r_x2": 171.67606, "r_y2": 597.07686, "r_x3": 151.70105, "r_y3": 597.07686, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 140.99304, "t": 609.6599, "r": 454.55496, "b": 618.46683, "coord_origin": "TOPLEFT" }, "confidence": 0.9036387801170349, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99304, "r_y0": 618.46683, "r_x1": 146.72054, "r_y1": 618.46683, "r_x2": 146.72054, "r_y2": 609.6599, "r_x3": 140.99304, "r_y3": 609.6599, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 618.46683, "r_x1": 193.48323, "r_y1": 618.46683, "r_x2": 193.48323, "r_y2": 609.66986, "r_x3": 151.70105, "r_y3": 609.66986, "coord_origin": "TOPLEFT" }, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.79904, "r_y0": 618.46683, "r_x1": 236.12042, "r_y1": 618.46683, "r_x2": 236.12042, "r_y2": 609.66986, "r_x3": 196.79904, "r_y3": 609.66986, "coord_origin": "TOPLEFT" }, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.12505, "r_y0": 618.46683, "r_x1": 454.55496, "r_y1": 618.46683, "r_x2": 454.55496, "r_y2": 609.66986, "r_x3": 236.12505, "r_y3": 609.66986, "coord_origin": "TOPLEFT" }, "text": ", to merge with both left and upper neighbor cells", "orig": ", to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "list_item", "bbox": { "l": 140.99304, "t": 622.2538900000001, "r": 328.61676, "b": 631.06082, "coord_origin": "TOPLEFT" }, "confidence": 0.8636871576309204, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99304, "r_y0": 631.06082, "r_x1": 146.72054, "r_y1": 631.06082, "r_x2": 146.72054, "r_y2": 622.2538900000001, "r_x3": 140.99304, "r_y3": 622.2538900000001, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 631.06082, "r_x1": 181.99434, "r_y1": 631.06082, "r_x2": 181.99434, "r_y2": 622.26385, "r_x3": 151.70105, "r_y3": 622.26385, "coord_origin": "TOPLEFT" }, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.31705, "r_y0": 631.06082, "r_x1": 221.46236, "r_y1": 631.06082, "r_x2": 221.46236, "r_y2": 622.26385, "r_x3": 185.31705, "r_y3": 622.26385, "coord_origin": "TOPLEFT" }, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46104, "r_y0": 631.06082, "r_x1": 328.61676, "r_y1": 631.06082, "r_x2": 328.61676, "r_y2": 622.26385, "r_x3": 221.46104, "r_y3": 622.26385, "coord_origin": "TOPLEFT" }, "text": ", switch to the next row.", "orig": ", switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "text", "bbox": { "l": 134.76505, "t": 644.10286, "r": 480.59280000000007, "b": 664.85484, "coord_origin": "TOPLEFT" }, "confidence": 0.9443338513374329, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70905, "r_y0": 652.8998300000001, "r_x1": 480.59280000000007, "r_y1": 652.8998300000001, "r_x2": 480.59280000000007, "r_y2": 644.10286, "r_x3": 149.70905, "r_y3": 644.10286, "coord_origin": "TOPLEFT" }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76505, "r_y0": 664.85484, "r_x1": 228.22321, "r_y1": 664.85484, "r_x2": 228.22321, "r_y2": 656.05786, "r_x3": 134.76505, "r_y3": 656.05786, "coord_origin": "TOPLEFT" }, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 14, "page_no": 5, "cluster": { "id": 14, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 139.37193, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8378868699073792, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6" }, { "label": "page_header", "id": 11, "page_no": 5, "cluster": { "id": 11, "label": "page_header", "bbox": { "l": 167.81335, "t": 93.77099999999996, "r": 231.72227, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8919177651405334, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "text", "id": 3, "page_no": 5, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.59479, "b": 139.68579, "coord_origin": "TOPLEFT" }, "confidence": 0.9633480906486511, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.59479, "r_y1": 127.73077, "r_x2": 480.59479, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 364.62503, "r_y1": 139.68579, "r_x2": 364.62503, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these complex syntax rules, simply to deliver valid output." }, { "label": "text", "id": 1, "page_no": 5, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76498, "t": 143.48279000000002, "r": 480.59569999999997, "b": 295.74191, "coord_origin": "TOPLEFT" }, "confidence": 0.9856827855110168, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 152.27979000000005, "r_x1": 480.58981, "r_y1": 152.27979000000005, "r_x2": 480.58981, "r_y2": 143.48279000000002, "r_x3": 149.709, "r_y3": 143.48279000000002, "coord_origin": "TOPLEFT" }, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 164.23479999999995, "r_x1": 480.59378, "r_y1": 164.23479999999995, "r_x2": 480.59378, "r_y2": 155.43781, "r_x3": 134.765, "r_y3": 155.43781, "coord_origin": "TOPLEFT" }, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 176.18982000000005, "r_x1": 480.5867, "r_y1": 176.18982000000005, "r_x2": 480.5867, "r_y2": 167.39282000000003, "r_x3": 134.765, "r_y3": 167.39282000000003, "coord_origin": "TOPLEFT" }, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 188.14484000000004, "r_x1": 480.59476, "r_y1": 188.14484000000004, "r_x2": 480.59476, "r_y2": 179.34784000000002, "r_x3": 134.765, "r_y3": 179.34784000000002, "coord_origin": "TOPLEFT" }, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 200.09984999999995, "r_x1": 314.27805, "r_y1": 200.09984999999995, "r_x2": 314.27805, "r_y2": 191.30286, "r_x3": 134.765, "r_y3": 191.30286, "coord_origin": "TOPLEFT" }, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.056, "r_y0": 200.09984999999995, "r_x1": 374.08664, "r_y1": 200.09984999999995, "r_x2": 374.08664, "r_y2": 191.30286, "r_x3": 318.056, "r_y3": 191.30286, "coord_origin": "TOPLEFT" }, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 378.80899, "r_y0": 200.09984999999995, "r_x1": 480.58594, "r_y1": 200.09984999999995, "r_x2": 480.58594, "r_y2": 191.30286, "r_x3": 378.80899, "r_y3": 191.30286, "coord_origin": "TOPLEFT" }, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 212.05584999999996, "r_x1": 480.58771, "r_y1": 212.05584999999996, "r_x2": 480.58771, "r_y2": 203.25885000000005, "r_x3": 134.76498, "r_y3": 203.25885000000005, "coord_origin": "TOPLEFT" }, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 224.01085999999998, "r_x1": 480.59569999999997, "r_y1": 224.01085999999998, "r_x2": 480.59569999999997, "r_y2": 215.21387000000004, "r_x3": 134.76498, "r_y3": 215.21387000000004, "coord_origin": "TOPLEFT" }, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 235.96587999999997, "r_x1": 480.59454, "r_y1": 235.96587999999997, "r_x2": 480.59454, "r_y2": 227.16887999999994, "r_x3": 134.76498, "r_y3": 227.16887999999994, "coord_origin": "TOPLEFT" }, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 247.92089999999996, "r_x1": 480.58759000000003, "r_y1": 247.92089999999996, "r_x2": 480.58759000000003, "r_y2": 239.12390000000005, "r_x3": 134.76498, "r_y3": 239.12390000000005, "coord_origin": "TOPLEFT" }, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 259.87591999999995, "r_x1": 480.59277, "r_y1": 259.87591999999995, "r_x2": 480.59277, "r_y2": 251.07892000000004, "r_x3": 134.76498, "r_y3": 251.07892000000004, "coord_origin": "TOPLEFT" }, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 271.83092999999997, "r_x1": 480.59463999999997, "r_y1": 271.83092999999997, "r_x2": 480.59463999999997, "r_y2": 263.03394000000003, "r_x3": 134.76498, "r_y3": 263.03394000000003, "coord_origin": "TOPLEFT" }, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 283.78693, "r_x1": 480.58978, "r_y1": 283.78693, "r_x2": 480.58978, "r_y2": 274.98992999999996, "r_x3": 134.76498, "r_y3": 274.98992999999996, "coord_origin": "TOPLEFT" }, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 295.74191, "r_x1": 223.57262, "r_y1": 295.74191, "r_x2": 223.57262, "r_y2": 286.94495, "r_x3": 134.76498, "r_y3": 286.94495, "coord_origin": "TOPLEFT" }, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In practice, we observe two major issues with prediction quality when training Im2Seq models on HTML table structure generation from images. On the one hand, we find that on large tables, the visual attention of the model often starts to drift and is not accurately moving forward cell by cell anymore. This manifests itself in either in an increasing location drift for proposed table-cells in later rows on the same column or even complete loss of vertical alignment, as illustrated in Figure 5. Addressing this with post-processing is partially possible, but clearly undesired. On the other hand, we find many instances of predictions with structural inconsistencies or plain invalid HTML output, as shown in Figure 6, which are nearly impossible to properly correct. Both problems seriously impact the TSR model performance, since they reflect not only in the task of pure structure recognition but also in the equally crucial recognition or matching of table cell content." }, { "label": "section_header", "id": 4, "page_no": 5, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 134.76498, "t": 320.6311, "r": 372.50848, "b": 331.19949, "coord_origin": "TOPLEFT" }, "confidence": 0.957028865814209, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 331.19949, "r_x1": 141.48859, "r_y1": 331.19949, "r_x2": 141.48859, "r_y2": 320.6311, "r_x3": 134.76498, "r_y3": 320.6311, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93819, "r_y0": 331.19949, "r_x1": 372.50848, "r_y1": 331.19949, "r_x2": 372.50848, "r_y2": 320.6311, "r_x3": 154.93819, "r_y3": 320.6311, "coord_origin": "TOPLEFT" }, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4 Optimised Table Structure Language" }, { "label": "text", "id": 0, "page_no": 5, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76498, "t": 349.11697, "r": 480.59473, "b": 441.59985, "coord_origin": "TOPLEFT" }, "confidence": 0.9879323840141296, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 357.91394, "r_x1": 480.59075999999993, "r_y1": 357.91394, "r_x2": 480.59075999999993, "r_y2": 349.11697, "r_x3": 134.76498, "r_y3": 349.11697, "coord_origin": "TOPLEFT" }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 369.86893, "r_x1": 480.58875, "r_y1": 369.86893, "r_x2": 480.58875, "r_y2": 361.07196000000005, "r_x3": 134.76498, "r_y3": 361.07196000000005, "coord_origin": "TOPLEFT" }, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 381.82492, "r_x1": 480.58681999999993, "r_y1": 381.82492, "r_x2": 480.58681999999993, "r_y2": 373.02795, "r_x3": 134.76498, "r_y3": 373.02795, "coord_origin": "TOPLEFT" }, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 393.77991, "r_x1": 480.58875, "r_y1": 393.77991, "r_x2": 480.58875, "r_y2": 384.98294, "r_x3": 134.76498, "r_y3": 384.98294, "coord_origin": "TOPLEFT" }, "text": "set of rules, which are both significantly reduced compared to HTML. At the", "orig": "set of rules, which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 405.73489, "r_x1": 480.58978, "r_y1": 405.73489, "r_x2": 480.58978, "r_y2": 396.93793, "r_x3": 134.76498, "r_y3": 396.93793, "coord_origin": "TOPLEFT" }, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 417.68988, "r_x1": 480.59473, "r_y1": 417.68988, "r_x2": 480.59473, "r_y2": 408.89291, "r_x3": 134.76498, "r_y3": 408.89291, "coord_origin": "TOPLEFT" }, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 429.64487, "r_x1": 480.58868, "r_y1": 429.64487, "r_x2": 480.58868, "r_y2": 420.8479, "r_x3": 134.76498, "r_y3": 420.8479, "coord_origin": "TOPLEFT" }, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 441.59985, "r_x1": 276.67325, "r_y1": 441.59985, "r_x2": 276.67325, "r_y2": 432.80289, "r_x3": 134.76498, "r_y3": 432.80289, "coord_origin": "TOPLEFT" }, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before, we propose here our Optimised Table Structure Language (OTSL). OTSL is designed to express table structure with a minimized vocabulary and a simple set of rules, which are both significantly reduced compared to HTML. At the same time, OTSL enables easy error detection and correction during sequence generation. We further demonstrate how the compact structure representation and minimized sequence length improves prediction accuracy and inference time in the TableFormer architecture." }, { "label": "section_header", "id": 5, "page_no": 5, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.76498, "t": 465.87192, "r": 261.80109, "b": 474.67886, "coord_origin": "TOPLEFT" }, "confidence": 0.9559652209281921, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 474.67886, "r_x1": 149.40204, "r_y1": 474.67886, "r_x2": 149.40204, "r_y2": 465.87192, "r_x3": 134.76498, "r_y3": 465.87192, "coord_origin": "TOPLEFT" }, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85902, "r_y0": 474.67886, "r_x1": 261.80109, "r_y1": 474.67886, "r_x2": 261.80109, "r_y2": 465.87192, "r_x3": 160.85902, "r_y3": 465.87192, "coord_origin": "TOPLEFT" }, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.1 Language Definition" }, { "label": "text", "id": 2, "page_no": 5, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76498, "t": 488.99789, "r": 480.58871, "b": 521.7058400000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9671263098716736, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 497.79486, "r_x1": 480.58871, "r_y1": 497.79486, "r_x2": 480.58871, "r_y2": 488.99789, "r_x3": 134.76498, "r_y3": 488.99789, "coord_origin": "TOPLEFT" }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 509.74985, "r_x1": 480.5867, "r_y1": 509.74985, "r_x2": 480.5867, "r_y2": 500.95288, "r_x3": 134.76498, "r_y3": 500.95288, "coord_origin": "TOPLEFT" }, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 521.7058400000001, "r_x1": 154.7131, "r_y1": 521.7058400000001, "r_x2": 154.7131, "r_y2": 512.90887, "r_x3": 134.76498, "r_y3": 512.90887, "coord_origin": "TOPLEFT" }, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines only 5 tokens that directly describe a tabular structure based on an atomic 2D grid." }, { "label": "text", "id": 13, "page_no": 5, "cluster": { "id": 13, "label": "text", "bbox": { "l": 149.70898, "t": 525.5018600000001, "r": 409.31137, "b": 534.29883, "coord_origin": "TOPLEFT" }, "confidence": 0.8555866479873657, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 534.29883, "r_x1": 409.31137, "r_y1": 534.29883, "r_x2": 409.31137, "r_y2": 525.5018600000001, "r_x3": 149.70898, "r_y3": 525.5018600000001, "coord_origin": "TOPLEFT" }, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The OTSL vocabulary is comprised of the following tokens:" }, { "label": "list_item", "id": 9, "page_no": 5, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 140.99298, "t": 547.96989, "r": 460.54443, "b": 556.77682, "coord_origin": "TOPLEFT" }, "confidence": 0.9184334874153137, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99298, "r_y0": 556.77682, "r_x1": 146.72047, "r_y1": 556.77682, "r_x2": 146.72047, "r_y2": 547.96989, "r_x3": 140.99298, "r_y3": 547.96989, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 556.77682, "r_x1": 193.20619, "r_y1": 556.77682, "r_x2": 193.20619, "r_y2": 547.97986, "r_x3": 151.70099, "r_y3": 547.97986, "coord_origin": "TOPLEFT" }, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.52199, "r_y0": 556.77682, "r_x1": 263.46564, "r_y1": 556.77682, "r_x2": 263.46564, "r_y2": 547.97986, "r_x3": 196.52199, "r_y3": 547.97986, "coord_origin": "TOPLEFT" }, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.815, "r_y0": 556.77682, "r_x1": 460.54443, "r_y1": 556.77682, "r_x2": 460.54443, "r_y2": 547.97986, "r_x3": 267.815, "r_y3": 547.97986, "coord_origin": "TOPLEFT" }, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"C\" cell a new table cell that either has or does not have cell content" }, { "label": "list_item", "id": 8, "page_no": 5, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 140.99301, "t": 560.5629, "r": 480.59392999999994, "b": 581.32483, "coord_origin": "TOPLEFT" }, "confidence": 0.9319931268692017, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99301, "r_y0": 569.36983, "r_x1": 146.7205, "r_y1": 569.36983, "r_x2": 146.7205, "r_y2": 560.5629, "r_x3": 140.99301, "r_y3": 560.5629, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70102, "r_y0": 569.36983, "r_x1": 194.30011, "r_y1": 569.36983, "r_x2": 194.30011, "r_y2": 560.57286, "r_x3": 151.70102, "r_y3": 560.57286, "coord_origin": "TOPLEFT" }, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.65903, "r_y0": 569.36983, "r_x1": 264.51779, "r_y1": 569.36983, "r_x2": 264.51779, "r_y2": 560.57286, "r_x3": 198.65903, "r_y3": 560.57286, "coord_origin": "TOPLEFT" }, "text": "left-looking cell", "orig": "left-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.51804, "r_y0": 569.36983, "r_x1": 480.59392999999994, "r_y1": 569.36983, "r_x2": 480.59392999999994, "r_y2": 560.57286, "r_x3": 264.51804, "r_y3": 560.57286, "coord_origin": "TOPLEFT" }, "text": ", merging with the left neighbor cell to create a", "orig": ", merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70103, "r_y0": 581.32483, "r_x1": 171.67604, "r_y1": 581.32483, "r_x2": 171.67604, "r_y2": 572.52786, "r_x3": 151.70103, "r_y3": 572.52786, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"L\" cell left-looking cell , merging with the left neighbor cell to create a span" }, { "label": "list_item", "id": 7, "page_no": 5, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 140.99304, "t": 585.11189, "r": 480.58856, "b": 605.87383, "coord_origin": "TOPLEFT" }, "confidence": 0.9438967704772949, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99304, "r_y0": 593.91882, "r_x1": 146.72054, "r_y1": 593.91882, "r_x2": 146.72054, "r_y2": 585.11189, "r_x3": 140.99304, "r_y3": 585.11189, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 593.91882, "r_x1": 194.11086, "r_y1": 593.91882, "r_x2": 194.11086, "r_y2": 585.12186, "r_x3": 151.70105, "r_y3": 585.12186, "coord_origin": "TOPLEFT" }, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 197.74805, "r_y0": 593.91882, "r_x1": 259.89474, "r_y1": 593.91882, "r_x2": 259.89474, "r_y2": 585.12186, "r_x3": 197.74805, "r_y3": 585.12186, "coord_origin": "TOPLEFT" }, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.89206, "r_y0": 593.91882, "r_x1": 480.58856, "r_y1": 593.91882, "r_x2": 480.58856, "r_y2": 585.12186, "r_x3": 259.89206, "r_y3": 585.12186, "coord_origin": "TOPLEFT" }, "text": ", merging with the upper neighbor cell to create a", "orig": ", merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 605.87383, "r_x1": 171.67606, "r_y1": 605.87383, "r_x2": 171.67606, "r_y2": 597.07686, "r_x3": 151.70105, "r_y3": 597.07686, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"U\" cell up-looking cell , merging with the upper neighbor cell to create a span" }, { "label": "list_item", "id": 10, "page_no": 5, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 140.99304, "t": 609.6599, "r": 454.55496, "b": 618.46683, "coord_origin": "TOPLEFT" }, "confidence": 0.9036387801170349, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99304, "r_y0": 618.46683, "r_x1": 146.72054, "r_y1": 618.46683, "r_x2": 146.72054, "r_y2": 609.6599, "r_x3": 140.99304, "r_y3": 609.6599, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 618.46683, "r_x1": 193.48323, "r_y1": 618.46683, "r_x2": 193.48323, "r_y2": 609.66986, "r_x3": 151.70105, "r_y3": 609.66986, "coord_origin": "TOPLEFT" }, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.79904, "r_y0": 618.46683, "r_x1": 236.12042, "r_y1": 618.46683, "r_x2": 236.12042, "r_y2": 609.66986, "r_x3": 196.79904, "r_y3": 609.66986, "coord_origin": "TOPLEFT" }, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.12505, "r_y0": 618.46683, "r_x1": 454.55496, "r_y1": 618.46683, "r_x2": 454.55496, "r_y2": 609.66986, "r_x3": 236.12505, "r_y3": 609.66986, "coord_origin": "TOPLEFT" }, "text": ", to merge with both left and upper neighbor cells", "orig": ", to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"X\" cell cross cell , to merge with both left and upper neighbor cells" }, { "label": "list_item", "id": 12, "page_no": 5, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 140.99304, "t": 622.2538900000001, "r": 328.61676, "b": 631.06082, "coord_origin": "TOPLEFT" }, "confidence": 0.8636871576309204, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99304, "r_y0": 631.06082, "r_x1": 146.72054, "r_y1": 631.06082, "r_x2": 146.72054, "r_y2": 622.2538900000001, "r_x3": 140.99304, "r_y3": 622.2538900000001, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 631.06082, "r_x1": 181.99434, "r_y1": 631.06082, "r_x2": 181.99434, "r_y2": 622.26385, "r_x3": 151.70105, "r_y3": 622.26385, "coord_origin": "TOPLEFT" }, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.31705, "r_y0": 631.06082, "r_x1": 221.46236, "r_y1": 631.06082, "r_x2": 221.46236, "r_y2": 622.26385, "r_x3": 185.31705, "r_y3": 622.26385, "coord_origin": "TOPLEFT" }, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46104, "r_y0": 631.06082, "r_x1": 328.61676, "r_y1": 631.06082, "r_x2": 328.61676, "r_y2": 622.26385, "r_x3": 221.46104, "r_y3": 622.26385, "coord_origin": "TOPLEFT" }, "text": ", switch to the next row.", "orig": ", switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"NL\" new-line , switch to the next row." }, { "label": "text", "id": 6, "page_no": 5, "cluster": { "id": 6, "label": "text", "bbox": { "l": 134.76505, "t": 644.10286, "r": 480.59280000000007, "b": 664.85484, "coord_origin": "TOPLEFT" }, "confidence": 0.9443338513374329, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70905, "r_y0": 652.8998300000001, "r_x1": 480.59280000000007, "r_y1": 652.8998300000001, "r_x2": 480.59280000000007, "r_y2": 644.10286, "r_x3": 149.70905, "r_y3": 644.10286, "coord_origin": "TOPLEFT" }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76505, "r_y0": 664.85484, "r_x1": 228.22321, "r_y1": 664.85484, "r_x2": 228.22321, "r_y2": 656.05786, "r_x3": 134.76505, "r_y3": 656.05786, "coord_origin": "TOPLEFT" }, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless conversion to HTML." } ], "body": [ { "label": "text", "id": 3, "page_no": 5, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.59479, "b": 139.68579, "coord_origin": "TOPLEFT" }, "confidence": 0.9633480906486511, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.59479, "r_y1": 127.73077, "r_x2": 480.59479, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 364.62503, "r_y1": 139.68579, "r_x2": 364.62503, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these complex syntax rules, simply to deliver valid output." }, { "label": "text", "id": 1, "page_no": 5, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76498, "t": 143.48279000000002, "r": 480.59569999999997, "b": 295.74191, "coord_origin": "TOPLEFT" }, "confidence": 0.9856827855110168, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 152.27979000000005, "r_x1": 480.58981, "r_y1": 152.27979000000005, "r_x2": 480.58981, "r_y2": 143.48279000000002, "r_x3": 149.709, "r_y3": 143.48279000000002, "coord_origin": "TOPLEFT" }, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 164.23479999999995, "r_x1": 480.59378, "r_y1": 164.23479999999995, "r_x2": 480.59378, "r_y2": 155.43781, "r_x3": 134.765, "r_y3": 155.43781, "coord_origin": "TOPLEFT" }, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 176.18982000000005, "r_x1": 480.5867, "r_y1": 176.18982000000005, "r_x2": 480.5867, "r_y2": 167.39282000000003, "r_x3": 134.765, "r_y3": 167.39282000000003, "coord_origin": "TOPLEFT" }, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 188.14484000000004, "r_x1": 480.59476, "r_y1": 188.14484000000004, "r_x2": 480.59476, "r_y2": 179.34784000000002, "r_x3": 134.765, "r_y3": 179.34784000000002, "coord_origin": "TOPLEFT" }, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 200.09984999999995, "r_x1": 314.27805, "r_y1": 200.09984999999995, "r_x2": 314.27805, "r_y2": 191.30286, "r_x3": 134.765, "r_y3": 191.30286, "coord_origin": "TOPLEFT" }, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.056, "r_y0": 200.09984999999995, "r_x1": 374.08664, "r_y1": 200.09984999999995, "r_x2": 374.08664, "r_y2": 191.30286, "r_x3": 318.056, "r_y3": 191.30286, "coord_origin": "TOPLEFT" }, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 378.80899, "r_y0": 200.09984999999995, "r_x1": 480.58594, "r_y1": 200.09984999999995, "r_x2": 480.58594, "r_y2": 191.30286, "r_x3": 378.80899, "r_y3": 191.30286, "coord_origin": "TOPLEFT" }, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 212.05584999999996, "r_x1": 480.58771, "r_y1": 212.05584999999996, "r_x2": 480.58771, "r_y2": 203.25885000000005, "r_x3": 134.76498, "r_y3": 203.25885000000005, "coord_origin": "TOPLEFT" }, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 224.01085999999998, "r_x1": 480.59569999999997, "r_y1": 224.01085999999998, "r_x2": 480.59569999999997, "r_y2": 215.21387000000004, "r_x3": 134.76498, "r_y3": 215.21387000000004, "coord_origin": "TOPLEFT" }, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 235.96587999999997, "r_x1": 480.59454, "r_y1": 235.96587999999997, "r_x2": 480.59454, "r_y2": 227.16887999999994, "r_x3": 134.76498, "r_y3": 227.16887999999994, "coord_origin": "TOPLEFT" }, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 247.92089999999996, "r_x1": 480.58759000000003, "r_y1": 247.92089999999996, "r_x2": 480.58759000000003, "r_y2": 239.12390000000005, "r_x3": 134.76498, "r_y3": 239.12390000000005, "coord_origin": "TOPLEFT" }, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 259.87591999999995, "r_x1": 480.59277, "r_y1": 259.87591999999995, "r_x2": 480.59277, "r_y2": 251.07892000000004, "r_x3": 134.76498, "r_y3": 251.07892000000004, "coord_origin": "TOPLEFT" }, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 271.83092999999997, "r_x1": 480.59463999999997, "r_y1": 271.83092999999997, "r_x2": 480.59463999999997, "r_y2": 263.03394000000003, "r_x3": 134.76498, "r_y3": 263.03394000000003, "coord_origin": "TOPLEFT" }, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 283.78693, "r_x1": 480.58978, "r_y1": 283.78693, "r_x2": 480.58978, "r_y2": 274.98992999999996, "r_x3": 134.76498, "r_y3": 274.98992999999996, "coord_origin": "TOPLEFT" }, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 295.74191, "r_x1": 223.57262, "r_y1": 295.74191, "r_x2": 223.57262, "r_y2": 286.94495, "r_x3": 134.76498, "r_y3": 286.94495, "coord_origin": "TOPLEFT" }, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In practice, we observe two major issues with prediction quality when training Im2Seq models on HTML table structure generation from images. On the one hand, we find that on large tables, the visual attention of the model often starts to drift and is not accurately moving forward cell by cell anymore. This manifests itself in either in an increasing location drift for proposed table-cells in later rows on the same column or even complete loss of vertical alignment, as illustrated in Figure 5. Addressing this with post-processing is partially possible, but clearly undesired. On the other hand, we find many instances of predictions with structural inconsistencies or plain invalid HTML output, as shown in Figure 6, which are nearly impossible to properly correct. Both problems seriously impact the TSR model performance, since they reflect not only in the task of pure structure recognition but also in the equally crucial recognition or matching of table cell content." }, { "label": "section_header", "id": 4, "page_no": 5, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 134.76498, "t": 320.6311, "r": 372.50848, "b": 331.19949, "coord_origin": "TOPLEFT" }, "confidence": 0.957028865814209, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 331.19949, "r_x1": 141.48859, "r_y1": 331.19949, "r_x2": 141.48859, "r_y2": 320.6311, "r_x3": 134.76498, "r_y3": 320.6311, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.93819, "r_y0": 331.19949, "r_x1": 372.50848, "r_y1": 331.19949, "r_x2": 372.50848, "r_y2": 320.6311, "r_x3": 154.93819, "r_y3": 320.6311, "coord_origin": "TOPLEFT" }, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4 Optimised Table Structure Language" }, { "label": "text", "id": 0, "page_no": 5, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76498, "t": 349.11697, "r": 480.59473, "b": 441.59985, "coord_origin": "TOPLEFT" }, "confidence": 0.9879323840141296, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 357.91394, "r_x1": 480.59075999999993, "r_y1": 357.91394, "r_x2": 480.59075999999993, "r_y2": 349.11697, "r_x3": 134.76498, "r_y3": 349.11697, "coord_origin": "TOPLEFT" }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 369.86893, "r_x1": 480.58875, "r_y1": 369.86893, "r_x2": 480.58875, "r_y2": 361.07196000000005, "r_x3": 134.76498, "r_y3": 361.07196000000005, "coord_origin": "TOPLEFT" }, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 381.82492, "r_x1": 480.58681999999993, "r_y1": 381.82492, "r_x2": 480.58681999999993, "r_y2": 373.02795, "r_x3": 134.76498, "r_y3": 373.02795, "coord_origin": "TOPLEFT" }, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 393.77991, "r_x1": 480.58875, "r_y1": 393.77991, "r_x2": 480.58875, "r_y2": 384.98294, "r_x3": 134.76498, "r_y3": 384.98294, "coord_origin": "TOPLEFT" }, "text": "set of rules, which are both significantly reduced compared to HTML. At the", "orig": "set of rules, which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 405.73489, "r_x1": 480.58978, "r_y1": 405.73489, "r_x2": 480.58978, "r_y2": 396.93793, "r_x3": 134.76498, "r_y3": 396.93793, "coord_origin": "TOPLEFT" }, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 417.68988, "r_x1": 480.59473, "r_y1": 417.68988, "r_x2": 480.59473, "r_y2": 408.89291, "r_x3": 134.76498, "r_y3": 408.89291, "coord_origin": "TOPLEFT" }, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 429.64487, "r_x1": 480.58868, "r_y1": 429.64487, "r_x2": 480.58868, "r_y2": 420.8479, "r_x3": 134.76498, "r_y3": 420.8479, "coord_origin": "TOPLEFT" }, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 441.59985, "r_x1": 276.67325, "r_y1": 441.59985, "r_x2": 276.67325, "r_y2": 432.80289, "r_x3": 134.76498, "r_y3": 432.80289, "coord_origin": "TOPLEFT" }, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before, we propose here our Optimised Table Structure Language (OTSL). OTSL is designed to express table structure with a minimized vocabulary and a simple set of rules, which are both significantly reduced compared to HTML. At the same time, OTSL enables easy error detection and correction during sequence generation. We further demonstrate how the compact structure representation and minimized sequence length improves prediction accuracy and inference time in the TableFormer architecture." }, { "label": "section_header", "id": 5, "page_no": 5, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.76498, "t": 465.87192, "r": 261.80109, "b": 474.67886, "coord_origin": "TOPLEFT" }, "confidence": 0.9559652209281921, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 474.67886, "r_x1": 149.40204, "r_y1": 474.67886, "r_x2": 149.40204, "r_y2": 465.87192, "r_x3": 134.76498, "r_y3": 465.87192, "coord_origin": "TOPLEFT" }, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85902, "r_y0": 474.67886, "r_x1": 261.80109, "r_y1": 474.67886, "r_x2": 261.80109, "r_y2": 465.87192, "r_x3": 160.85902, "r_y3": 465.87192, "coord_origin": "TOPLEFT" }, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.1 Language Definition" }, { "label": "text", "id": 2, "page_no": 5, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76498, "t": 488.99789, "r": 480.58871, "b": 521.7058400000001, "coord_origin": "TOPLEFT" }, "confidence": 0.9671263098716736, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 497.79486, "r_x1": 480.58871, "r_y1": 497.79486, "r_x2": 480.58871, "r_y2": 488.99789, "r_x3": 134.76498, "r_y3": 488.99789, "coord_origin": "TOPLEFT" }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 509.74985, "r_x1": 480.5867, "r_y1": 509.74985, "r_x2": 480.5867, "r_y2": 500.95288, "r_x3": 134.76498, "r_y3": 500.95288, "coord_origin": "TOPLEFT" }, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 521.7058400000001, "r_x1": 154.7131, "r_y1": 521.7058400000001, "r_x2": 154.7131, "r_y2": 512.90887, "r_x3": 134.76498, "r_y3": 512.90887, "coord_origin": "TOPLEFT" }, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines only 5 tokens that directly describe a tabular structure based on an atomic 2D grid." }, { "label": "text", "id": 13, "page_no": 5, "cluster": { "id": 13, "label": "text", "bbox": { "l": 149.70898, "t": 525.5018600000001, "r": 409.31137, "b": 534.29883, "coord_origin": "TOPLEFT" }, "confidence": 0.8555866479873657, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 534.29883, "r_x1": 409.31137, "r_y1": 534.29883, "r_x2": 409.31137, "r_y2": 525.5018600000001, "r_x3": 149.70898, "r_y3": 525.5018600000001, "coord_origin": "TOPLEFT" }, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The OTSL vocabulary is comprised of the following tokens:" }, { "label": "list_item", "id": 9, "page_no": 5, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 140.99298, "t": 547.96989, "r": 460.54443, "b": 556.77682, "coord_origin": "TOPLEFT" }, "confidence": 0.9184334874153137, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99298, "r_y0": 556.77682, "r_x1": 146.72047, "r_y1": 556.77682, "r_x2": 146.72047, "r_y2": 547.96989, "r_x3": 140.99298, "r_y3": 547.96989, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 556.77682, "r_x1": 193.20619, "r_y1": 556.77682, "r_x2": 193.20619, "r_y2": 547.97986, "r_x3": 151.70099, "r_y3": 547.97986, "coord_origin": "TOPLEFT" }, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.52199, "r_y0": 556.77682, "r_x1": 263.46564, "r_y1": 556.77682, "r_x2": 263.46564, "r_y2": 547.97986, "r_x3": 196.52199, "r_y3": 547.97986, "coord_origin": "TOPLEFT" }, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.815, "r_y0": 556.77682, "r_x1": 460.54443, "r_y1": 556.77682, "r_x2": 460.54443, "r_y2": 547.97986, "r_x3": 267.815, "r_y3": 547.97986, "coord_origin": "TOPLEFT" }, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"C\" cell a new table cell that either has or does not have cell content" }, { "label": "list_item", "id": 8, "page_no": 5, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 140.99301, "t": 560.5629, "r": 480.59392999999994, "b": 581.32483, "coord_origin": "TOPLEFT" }, "confidence": 0.9319931268692017, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99301, "r_y0": 569.36983, "r_x1": 146.7205, "r_y1": 569.36983, "r_x2": 146.7205, "r_y2": 560.5629, "r_x3": 140.99301, "r_y3": 560.5629, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70102, "r_y0": 569.36983, "r_x1": 194.30011, "r_y1": 569.36983, "r_x2": 194.30011, "r_y2": 560.57286, "r_x3": 151.70102, "r_y3": 560.57286, "coord_origin": "TOPLEFT" }, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.65903, "r_y0": 569.36983, "r_x1": 264.51779, "r_y1": 569.36983, "r_x2": 264.51779, "r_y2": 560.57286, "r_x3": 198.65903, "r_y3": 560.57286, "coord_origin": "TOPLEFT" }, "text": "left-looking cell", "orig": "left-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.51804, "r_y0": 569.36983, "r_x1": 480.59392999999994, "r_y1": 569.36983, "r_x2": 480.59392999999994, "r_y2": 560.57286, "r_x3": 264.51804, "r_y3": 560.57286, "coord_origin": "TOPLEFT" }, "text": ", merging with the left neighbor cell to create a", "orig": ", merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70103, "r_y0": 581.32483, "r_x1": 171.67604, "r_y1": 581.32483, "r_x2": 171.67604, "r_y2": 572.52786, "r_x3": 151.70103, "r_y3": 572.52786, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"L\" cell left-looking cell , merging with the left neighbor cell to create a span" }, { "label": "list_item", "id": 7, "page_no": 5, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 140.99304, "t": 585.11189, "r": 480.58856, "b": 605.87383, "coord_origin": "TOPLEFT" }, "confidence": 0.9438967704772949, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99304, "r_y0": 593.91882, "r_x1": 146.72054, "r_y1": 593.91882, "r_x2": 146.72054, "r_y2": 585.11189, "r_x3": 140.99304, "r_y3": 585.11189, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 593.91882, "r_x1": 194.11086, "r_y1": 593.91882, "r_x2": 194.11086, "r_y2": 585.12186, "r_x3": 151.70105, "r_y3": 585.12186, "coord_origin": "TOPLEFT" }, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 197.74805, "r_y0": 593.91882, "r_x1": 259.89474, "r_y1": 593.91882, "r_x2": 259.89474, "r_y2": 585.12186, "r_x3": 197.74805, "r_y3": 585.12186, "coord_origin": "TOPLEFT" }, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.89206, "r_y0": 593.91882, "r_x1": 480.58856, "r_y1": 593.91882, "r_x2": 480.58856, "r_y2": 585.12186, "r_x3": 259.89206, "r_y3": 585.12186, "coord_origin": "TOPLEFT" }, "text": ", merging with the upper neighbor cell to create a", "orig": ", merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 605.87383, "r_x1": 171.67606, "r_y1": 605.87383, "r_x2": 171.67606, "r_y2": 597.07686, "r_x3": 151.70105, "r_y3": 597.07686, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"U\" cell up-looking cell , merging with the upper neighbor cell to create a span" }, { "label": "list_item", "id": 10, "page_no": 5, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 140.99304, "t": 609.6599, "r": 454.55496, "b": 618.46683, "coord_origin": "TOPLEFT" }, "confidence": 0.9036387801170349, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99304, "r_y0": 618.46683, "r_x1": 146.72054, "r_y1": 618.46683, "r_x2": 146.72054, "r_y2": 609.6599, "r_x3": 140.99304, "r_y3": 609.6599, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 618.46683, "r_x1": 193.48323, "r_y1": 618.46683, "r_x2": 193.48323, "r_y2": 609.66986, "r_x3": 151.70105, "r_y3": 609.66986, "coord_origin": "TOPLEFT" }, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.79904, "r_y0": 618.46683, "r_x1": 236.12042, "r_y1": 618.46683, "r_x2": 236.12042, "r_y2": 609.66986, "r_x3": 196.79904, "r_y3": 609.66986, "coord_origin": "TOPLEFT" }, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.12505, "r_y0": 618.46683, "r_x1": 454.55496, "r_y1": 618.46683, "r_x2": 454.55496, "r_y2": 609.66986, "r_x3": 236.12505, "r_y3": 609.66986, "coord_origin": "TOPLEFT" }, "text": ", to merge with both left and upper neighbor cells", "orig": ", to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"X\" cell cross cell , to merge with both left and upper neighbor cells" }, { "label": "list_item", "id": 12, "page_no": 5, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 140.99304, "t": 622.2538900000001, "r": 328.61676, "b": 631.06082, "coord_origin": "TOPLEFT" }, "confidence": 0.8636871576309204, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99304, "r_y0": 631.06082, "r_x1": 146.72054, "r_y1": 631.06082, "r_x2": 146.72054, "r_y2": 622.2538900000001, "r_x3": 140.99304, "r_y3": 622.2538900000001, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70105, "r_y0": 631.06082, "r_x1": 181.99434, "r_y1": 631.06082, "r_x2": 181.99434, "r_y2": 622.26385, "r_x3": 151.70105, "r_y3": 622.26385, "coord_origin": "TOPLEFT" }, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.31705, "r_y0": 631.06082, "r_x1": 221.46236, "r_y1": 631.06082, "r_x2": 221.46236, "r_y2": 622.26385, "r_x3": 185.31705, "r_y3": 622.26385, "coord_origin": "TOPLEFT" }, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46104, "r_y0": 631.06082, "r_x1": 328.61676, "r_y1": 631.06082, "r_x2": 328.61676, "r_y2": 622.26385, "r_x3": 221.46104, "r_y3": 622.26385, "coord_origin": "TOPLEFT" }, "text": ", switch to the next row.", "orig": ", switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"NL\" new-line , switch to the next row." }, { "label": "text", "id": 6, "page_no": 5, "cluster": { "id": 6, "label": "text", "bbox": { "l": 134.76505, "t": 644.10286, "r": 480.59280000000007, "b": 664.85484, "coord_origin": "TOPLEFT" }, "confidence": 0.9443338513374329, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70905, "r_y0": 652.8998300000001, "r_x1": 480.59280000000007, "r_y1": 652.8998300000001, "r_x2": 480.59280000000007, "r_y2": 644.10286, "r_x3": 149.70905, "r_y3": 644.10286, "coord_origin": "TOPLEFT" }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76505, "r_y0": 664.85484, "r_x1": 228.22321, "r_y1": 664.85484, "r_x2": 228.22321, "r_y2": 656.05786, "r_x3": 134.76505, "r_y3": 656.05786, "coord_origin": "TOPLEFT" }, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless conversion to HTML." } ], "headers": [ { "label": "page_header", "id": 14, "page_no": 5, "cluster": { "id": 14, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 139.37193, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8378868699073792, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6" }, { "label": "page_header", "id": 11, "page_no": 5, "cluster": { "id": 11, "label": "page_header", "bbox": { "l": 167.81335, "t": 93.77099999999996, "r": 231.72227, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8919177651405334, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 6, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 133.72551999999996, "r_x1": 162.64424, "r_y1": 133.72551999999996, "r_x2": 162.64424, "r_y2": 125.79918999999984, "r_x3": 134.765, "r_y3": 125.79918999999984, "coord_origin": "TOPLEFT" }, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.276, "r_y0": 133.93169999999998, "r_x1": 480.58675999999997, "r_y1": 133.93169999999998, "r_x2": 480.58675999999997, "r_y2": 125.86200000000008, "r_x3": 166.276, "r_y3": 125.86200000000008, "coord_origin": "TOPLEFT" }, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 144.89068999999995, "r_x1": 480.5874, "r_y1": 144.89068999999995, "r_x2": 480.5874, "r_y2": 136.82097999999996, "r_x3": 134.765, "r_y3": 136.82097999999996, "coord_origin": "TOPLEFT" }, "text": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "orig": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 155.84966999999995, "r_x1": 306.1156, "r_y1": 155.84966999999995, "r_x2": 306.1156, "r_y2": 147.77997000000005, "r_x3": 134.765, "r_y3": 147.77997000000005, "coord_origin": "TOPLEFT" }, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49326, "r_y0": 177.91540999999995, "r_x1": 381.66843, "r_y1": 177.91540999999995, "r_x2": 381.66843, "r_y2": 168.59362999999996, "r_x3": 374.49326, "r_y3": 168.59362999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74011, "r_y0": 177.82183999999995, "r_x1": 405.91528, "r_y1": 177.82183999999995, "r_x2": 405.91528, "r_y2": 168.50005999999996, "r_x3": 398.74011, "r_y3": 168.50005999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.76862, "r_y0": 202.24730999999997, "r_x1": 380.94379, "r_y1": 202.24730999999997, "r_x2": 380.94379, "r_y2": 192.92553999999996, "r_x3": 373.76862, "r_y3": 192.92553999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66388, "r_y0": 202.39239999999995, "r_x1": 393.83905, "r_y1": 202.39239999999995, "r_x2": 393.83905, "r_y2": 193.07061999999996, "r_x3": 386.66388, "r_y3": 193.07061999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.68707, "r_y0": 214.45934999999997, "r_x1": 393.86224, "r_y1": 214.45934999999997, "r_x2": 393.86224, "r_y2": 205.13756999999998, "r_x3": 386.68707, "r_y3": 205.13756999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.65729, "r_y0": 190.05457, "r_x1": 405.83246, "r_y1": 190.05457, "r_x2": 405.83246, "r_y2": 180.73279000000002, "r_x3": 398.65729, "r_y3": 180.73279000000002, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.77908, "r_y0": 190.06035999999995, "r_x1": 417.95425, "r_y1": 190.06035999999995, "r_x2": 417.95425, "r_y2": 180.73859000000004, "r_x3": 410.77908, "r_y3": 180.73859000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.90503, "r_y0": 189.97424, "r_x1": 430.08020000000005, "r_y1": 189.97424, "r_x2": 430.08020000000005, "r_y2": 180.65247, "r_x3": 422.90503, "r_y3": 180.65247, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7807, "r_y0": 202.31042000000002, "r_x1": 405.95587, "r_y1": 202.31042000000002, "r_x2": 405.95587, "r_y2": 192.98865, "r_x3": 398.7807, "r_y3": 192.98865, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90164, "r_y0": 202.31664999999998, "r_x1": 418.07681, "r_y1": 202.31664999999998, "r_x2": 418.07681, "r_y2": 192.99487, "r_x3": 410.90164, "r_y3": 192.99487, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.02753, "r_y0": 202.23077, "r_x1": 430.2027, "r_y1": 202.23077, "r_x2": 430.2027, "r_y2": 192.909, "r_x3": 423.02753, "r_y3": 192.909, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78235, "r_y0": 214.63751000000002, "r_x1": 405.95752, "r_y1": 214.63751000000002, "r_x2": 405.95752, "r_y2": 205.31573000000003, "r_x3": 398.78235, "r_y3": 205.31573000000003, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90414, "r_y0": 214.64373999999998, "r_x1": 418.07932, "r_y1": 214.64373999999998, "r_x2": 418.07932, "r_y2": 205.32196, "r_x3": 410.90414, "r_y3": 205.32196, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03003, "r_y0": 214.55791999999997, "r_x1": 430.20520000000005, "r_y1": 214.55791999999997, "r_x2": 430.20520000000005, "r_y2": 205.23614999999995, "r_x3": 423.03003, "r_y3": 205.23614999999995, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.50574, "r_y0": 226.36059999999998, "r_x1": 393.68091, "r_y1": 226.36059999999998, "r_x2": 393.68091, "r_y2": 217.03882, "r_x3": 386.50574, "r_y3": 217.03882, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.60181, "r_y0": 226.53882, "r_x1": 405.77698, "r_y1": 226.53882, "r_x2": 405.77698, "r_y2": 217.21704, "r_x3": 398.60181, "r_y3": 217.21704, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72275, "r_y0": 226.54498, "r_x1": 417.89792, "r_y1": 226.54498, "r_x2": 417.89792, "r_y2": 217.22321, "r_x3": 410.72275, "r_y3": 217.22321, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.84869, "r_y0": 226.45916999999997, "r_x1": 430.02386, "r_y1": 226.45916999999997, "r_x2": 430.02386, "r_y2": 217.13738999999998, "r_x3": 422.84869, "r_y3": 217.13738999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16009999999994, "r_y0": 177.01189999999997, "r_x1": 447.86273, "r_y1": 177.01189999999997, "r_x2": 447.86273, "r_y2": 167.69011999999998, "r_x3": 435.16009999999994, "r_y3": 167.69011999999998, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44415, "r_y0": 189.52202999999997, "r_x1": 448.14679, "r_y1": 189.52202999999997, "r_x2": 448.14679, "r_y2": 180.20025999999996, "r_x3": 435.44415, "r_y3": 180.20025999999996, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.46735, "r_y0": 201.81652999999994, "r_x1": 448.16998000000007, "r_y1": 201.81652999999994, "r_x2": 448.16998000000007, "r_y2": 192.49474999999995, "r_x3": 435.46735, "r_y3": 192.49474999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38202, "r_y0": 214.15204000000006, "r_x1": 448.08466, "r_y1": 214.15204000000006, "r_x2": 448.08466, "r_y2": 204.83025999999995, "r_x3": 435.38202, "r_y3": 204.83025999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.59906, "r_y0": 226.55548, "r_x1": 448.3017, "r_y1": 226.55548, "r_x2": 448.3017, "r_y2": 217.2337, "r_x3": 435.59906, "r_y3": 217.2337, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.14957, "r_y0": 214.55669999999998, "r_x1": 381.32474, "r_y1": 214.55669999999998, "r_x2": 381.32474, "r_y2": 205.23492, "r_x3": 374.14957, "r_y3": 205.23492, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0419, "r_y0": 226.46826, "r_x1": 381.21707, "r_y1": 226.46826, "r_x2": 381.21707, "r_y2": 217.14648, "r_x3": 374.0419, "r_y3": 217.14648, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34418, "r_y0": 190.25665000000004, "r_x1": 381.51935, "r_y1": 190.25665000000004, "r_x2": 381.51935, "r_y2": 180.93488000000002, "r_x3": 374.34418, "r_y3": 180.93488000000002, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76285, "r_y0": 177.89966000000004, "r_x1": 393.28833, "r_y1": 177.89966000000004, "r_x2": 393.28833, "r_y2": 168.57788000000005, "r_x3": 387.76285, "r_y3": 168.57788000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86395, "r_y0": 177.38373, "r_x1": 417.38943, "r_y1": 177.38373, "r_x2": 417.38943, "r_y2": 168.06195000000002, "r_x3": 411.86395, "r_y3": 168.06195000000002, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.33563, "r_y0": 177.25616000000002, "r_x1": 428.86111, "r_y1": 177.25616000000002, "r_x2": 428.86111, "r_y2": 167.93439, "r_x3": 423.33563, "r_y3": 167.93439, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.13593, "r_y0": 190.10753999999997, "r_x1": 393.76453, "r_y1": 190.10753999999997, "r_x2": 393.76453, "r_y2": 180.78576999999996, "r_x3": 387.13593, "r_y3": 180.78576999999996, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.2594, "r_y0": 253.83056999999997, "r_x1": 289.43457, "r_y1": 253.83056999999997, "r_x2": 289.43457, "r_y2": 244.50878999999998, "r_x3": 282.2594, "r_y3": 244.50878999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11035, "r_y0": 266.172, "r_x1": 289.28552, "r_y1": 266.172, "r_x2": 289.28552, "r_y2": 256.85022000000004, "r_x3": 282.11035, "r_y3": 256.85022000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.40848, "r_y0": 278.45477000000005, "r_x1": 289.58365, "r_y1": 278.45477000000005, "r_x2": 289.58365, "r_y2": 269.13300000000004, "r_x3": 282.40848, "r_y3": 269.13300000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.52902, "r_y0": 253.81525, "r_x1": 301.0545, "r_y1": 253.81525, "r_x2": 301.0545, "r_y2": 244.49347, "r_x3": 295.52902, "r_y3": 244.49347, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.46613, "r_y0": 253.89550999999994, "r_x1": 312.99161, "r_y1": 253.89550999999994, "r_x2": 312.99161, "r_y2": 244.57372999999995, "r_x3": 307.46613, "r_y3": 244.57372999999995, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.76886, "r_y0": 253.76215000000002, "r_x1": 324.29434, "r_y1": 253.76215000000002, "r_x2": 324.29434, "r_y2": 244.44037000000003, "r_x3": 318.76886, "r_y3": 244.44037000000003, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9021, "r_y0": 266.02332, "r_x1": 301.03976, "r_y1": 266.02332, "r_x2": 301.03976, "r_y2": 256.70154, "r_x3": 294.9021, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.17743, "r_y0": 266.02332, "r_x1": 325.59039, "r_y1": 266.02332, "r_x2": 325.59039, "r_y2": 256.70154, "r_x3": 307.17743, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.78949, "r_y0": 278.57599000000005, "r_x1": 300.92715, "r_y1": 278.57599000000005, "r_x2": 300.92715, "r_y2": 269.25420999999994, "r_x3": 294.78949, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06482, "r_y0": 278.57599000000005, "r_x1": 325.47778, "r_y1": 278.57599000000005, "r_x2": 325.47778, "r_y2": 269.25420999999994, "r_x3": 307.06482, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.93939, "r_y0": 278.06976, "r_x1": 203.11456, "r_y1": 278.06976, "r_x2": 203.11456, "r_y2": 268.74798999999996, "r_x3": 195.93939, "r_y3": 268.74798999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.20891, "r_y0": 278.05444, "r_x1": 214.73439, "r_y1": 278.05444, "r_x2": 214.73439, "r_y2": 268.73267, "r_x3": 209.20891, "r_y3": 268.73267, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.14551, "r_y0": 278.13469999999995, "r_x1": 226.67099, "r_y1": 278.13469999999995, "r_x2": 226.67099, "r_y2": 268.81293000000005, "r_x3": 221.14551, "r_y3": 268.81293000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.44858, "r_y0": 278.00134, "r_x1": 237.97405999999998, "r_y1": 278.00134, "r_x2": 237.97405999999998, "r_y2": 268.67957, "r_x3": 232.44858, "r_y3": 268.67957, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.21715, "r_y0": 253.86139000000003, "r_x1": 203.39232, "r_y1": 253.86139000000003, "r_x2": 203.39232, "r_y2": 244.53961000000004, "r_x3": 196.21715, "r_y3": 244.53961000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32143, "r_y0": 253.41992000000005, "r_x1": 257.49661, "r_y1": 253.41992000000005, "r_x2": 257.49661, "r_y2": 244.09813999999994, "r_x3": 250.32143, "r_y3": 244.09813999999994, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17235999999997, "r_y0": 265.76129000000003, "r_x1": 257.34753, "r_y1": 265.76129000000003, "r_x2": 257.34753, "r_y2": 256.43951000000004, "r_x3": 250.17235999999997, "r_y3": 256.43951000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47049000000004, "r_y0": 278.04400999999996, "r_x1": 257.64566, "r_y1": 278.04400999999996, "r_x2": 257.64566, "r_y2": 268.72222999999997, "r_x3": 250.47049000000004, "r_y3": 268.72222999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 249.20911, "r_x1": 337.22485, "r_y1": 249.20911, "r_x2": 337.22485, "r_y2": 242.99463000000003, "r_x3": 334.51135, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.93835, "r_y0": 249.20911, "r_x1": 391.49472, "r_y1": 249.20911, "r_x2": 391.49472, "r_y2": 242.99463000000003, "r_x3": 339.93835, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 259.14703, "r_x1": 337.33313, "r_y1": 259.14703, "r_x2": 337.33313, "r_y2": 252.93255999999997, "r_x3": 334.51135, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15491, "r_y0": 259.14703, "r_x1": 421.98624, "r_y1": 259.14703, "r_x2": 421.98624, "r_y2": 252.93255999999997, "r_x3": 340.15491, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 269.08496, "r_x1": 337.29868, "r_y1": 269.08496, "r_x2": 337.29868, "r_y2": 262.87048000000004, "r_x3": 334.51135, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.086, "r_y0": 269.08496, "r_x1": 415.34375, "r_y1": 269.08496, "r_x2": 415.34375, "r_y2": 262.87048000000004, "r_x3": 340.086, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 279.02288999999996, "r_x1": 337.30188, "r_y1": 279.02288999999996, "r_x2": 337.30188, "r_y2": 272.80841, "r_x3": 334.51135, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09241, "r_y0": 279.02288999999996, "r_x1": 426.59875, "r_y1": 279.02288999999996, "r_x2": 426.59875, "r_y2": 272.80841, "r_x3": 340.09241, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67178, "r_y0": 250.25671, "r_x1": 189.35544, "r_y1": 250.25671, "r_x2": 189.35544, "r_y2": 244.04224, "r_x3": 185.67178, "r_y3": 244.04224, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.96759, "r_y0": 274.56213, "r_x1": 189.65125, "r_y1": 274.56213, "r_x2": 189.65125, "r_y2": 268.34766, "r_x3": 185.96759, "r_y3": 268.34766, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34152, "r_y0": 249.83972000000006, "r_x1": 243.02518, "r_y1": 249.83972000000006, "r_x2": 243.02518, "r_y2": 243.62523999999996, "r_x3": 239.34152, "r_y3": 243.62523999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.32852, "r_y0": 249.70836999999995, "r_x1": 275.01218, "r_y1": 249.70836999999995, "r_x2": 275.01218, "r_y2": 243.49390000000005, "r_x3": 271.32852, "r_y3": 243.49390000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.81627, "r_y0": 172.72942999999998, "r_x1": 233.49992000000003, "r_y1": 172.72942999999998, "r_x2": 233.49992000000003, "r_y2": 166.51495, "r_x3": 229.81627, "r_y3": 166.51495, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24402, "r_y0": 196.17548, "r_x1": 260.92767, "r_y1": 196.17548, "r_x2": 260.92767, "r_y2": 189.961, "r_x3": 257.24402, "r_y3": 189.961, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.87526, "r_y0": 184.19115999999997, "r_x1": 190.55891, "r_y1": 184.19115999999997, "r_x2": 190.55891, "r_y2": 177.97668, "r_x3": 186.87526, "r_y3": 177.97668, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.48746, "r_y0": 175.22968000000003, "r_x1": 200.17111, "r_y1": 175.22968000000003, "r_x2": 200.17111, "r_y2": 169.01520000000005, "r_x3": 196.48746, "r_y3": 169.01520000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 175.65039000000002, "r_x1": 175.72659, "r_y1": 175.65039000000002, "r_x2": 175.72659, "r_y2": 167.88225999999997, "r_x3": 169.74728, "r_y3": 167.88225999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 214.60681, "r_x1": 175.72659, "r_y1": 214.60681, "r_x2": 175.72659, "r_y2": 206.83867999999995, "r_x3": 169.74728, "r_y3": 206.83867999999995, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29419, "r_y0": 176.04785000000004, "r_x1": 280.2735, "r_y1": 176.04785000000004, "r_x2": 280.2735, "r_y2": 168.27972, "r_x3": 274.29419, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56152, "r_y0": 176.04785000000004, "r_x1": 365.54083, "r_y1": 176.04785000000004, "r_x2": 365.54083, "r_y2": 168.27972, "r_x3": 359.56152, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 250.97960999999998, "r_x1": 175.27112, "r_y1": 250.97960999999998, "r_x2": 175.27112, "r_y2": 243.21149000000003, "r_x3": 169.74728, "r_y3": 243.21149000000003, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 314.10275, "r_x1": 149.40205, "r_y1": 314.10275, "r_x2": 149.40205, "r_y2": 305.29581, "r_x3": 134.765, "r_y3": 305.29581, "coord_origin": "TOPLEFT" }, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 314.10275, "r_x1": 246.65197999999998, "r_y1": 314.10275, "r_x2": 246.65197999999998, "r_y2": 305.29581, "r_x3": 160.85904, "r_y3": 305.29581, "coord_origin": "TOPLEFT" }, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 334.04474, "r_x1": 363.79617, "r_y1": 334.04474, "r_x2": 363.79617, "r_y2": 325.24777, "r_x3": 134.765, "r_y3": 325.24777, "coord_origin": "TOPLEFT" }, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 355.97775, "r_x1": 146.71991, "r_y1": 355.97775, "r_x2": 146.71991, "r_y2": 347.18079, "r_x3": 138.97299, "r_y3": 347.18079, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 355.97775, "r_x1": 257.37927, "r_y1": 355.97775, "r_x2": 257.37927, "r_y2": 347.17081, "r_x3": 151.70099, "r_y3": 347.17081, "coord_origin": "TOPLEFT" }, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.383, "r_y0": 355.97775, "r_x1": 480.58902, "r_y1": 355.97775, "r_x2": 480.58902, "r_y2": 347.18079, "r_x3": 257.383, "r_y3": 347.18079, "coord_origin": "TOPLEFT" }, "text": ": The left neighbour of an \"L\" cell must be either", "orig": ": The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 367.93375, "r_x1": 283.59387, "r_y1": 367.93375, "r_x2": 283.59387, "r_y2": 359.13678, "r_x3": 151.70099, "r_y3": 359.13678, "coord_origin": "TOPLEFT" }, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 379.89175, "r_x1": 146.71991, "r_y1": 379.89175, "r_x2": 146.71991, "r_y2": 371.09479, "r_x3": 138.97299, "r_y3": 371.09479, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 379.89175, "r_x1": 252.11203, "r_y1": 379.89175, "r_x2": 252.11203, "r_y2": 371.08481, "r_x3": 151.70099, "r_y3": 371.08481, "coord_origin": "TOPLEFT" }, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.112, "r_y0": 379.89175, "r_x1": 480.59229000000005, "r_y1": 379.89175, "r_x2": 480.59229000000005, "r_y2": 371.09479, "r_x3": 252.112, "r_y3": 371.09479, "coord_origin": "TOPLEFT" }, "text": ": The upper neighbour of a \"U\" cell must be either", "orig": ": The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 391.84673999999995, "r_x1": 284.8392, "r_y1": 391.84673999999995, "r_x2": 284.8392, "r_y2": 383.04977, "r_x3": 151.70099, "r_y3": 383.04977, "coord_origin": "TOPLEFT" }, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 403.80475, "r_x1": 146.71991, "r_y1": 403.80475, "r_x2": 146.71991, "r_y2": 395.0077800000001, "r_x3": 138.97299, "r_y3": 395.0077800000001, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 403.80475, "r_x1": 223.3042, "r_y1": 403.80475, "r_x2": 223.3042, "r_y2": 394.99780000000004, "r_x3": 151.70099, "r_y3": 394.99780000000004, "coord_origin": "TOPLEFT" }, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.30699, "r_y0": 403.80475, "r_x1": 226.07360999999997, "r_y1": 403.80475, "r_x2": 226.07360999999997, "r_y2": 395.0077800000001, "r_x3": 223.30699, "r_y3": 395.0077800000001, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 415.76373, "r_x1": 480.59238, "r_y1": 415.76373, "r_x2": 480.59238, "r_y2": 406.96677, "r_x3": 151.70099, "r_y3": 406.96677, "coord_origin": "TOPLEFT" }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 427.71871999999996, "r_x1": 480.59219, "r_y1": 427.71871999999996, "r_x2": 480.59219, "r_y2": 418.9217499999999, "r_x3": 151.70099, "r_y3": 418.9217499999999, "coord_origin": "TOPLEFT" }, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 439.67371, "r_x1": 214.39663999999996, "r_y1": 439.67371, "r_x2": 214.39663999999996, "r_y2": 430.87674, "r_x3": 151.70099, "r_y3": 430.87674, "coord_origin": "TOPLEFT" }, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 451.63269, "r_x1": 146.71991, "r_y1": 451.63269, "r_x2": 146.71991, "r_y2": 442.83572, "r_x3": 138.97299, "r_y3": 442.83572, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 451.63269, "r_x1": 221.32263, "r_y1": 451.63269, "r_x2": 221.32263, "r_y2": 442.82574, "r_x3": 151.70099, "r_y3": 442.82574, "coord_origin": "TOPLEFT" }, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.32700000000003, "r_y0": 451.63269, "r_x1": 474.59018, "r_y1": 451.63269, "r_x2": 474.59018, "r_y2": 442.83572, "r_x3": 221.32700000000003, "r_y3": 442.83572, "coord_origin": "TOPLEFT" }, "text": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 463.5907, "r_x1": 146.71991, "r_y1": 463.5907, "r_x2": 146.71991, "r_y2": 454.7937299999999, "r_x3": 138.97299, "r_y3": 454.7937299999999, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 463.5907, "r_x1": 240.71982, "r_y1": 463.5907, "r_x2": 240.71982, "r_y2": 454.78375, "r_x3": 151.70099, "r_y3": 454.78375, "coord_origin": "TOPLEFT" }, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.71599, "r_y0": 463.5907, "r_x1": 480.58746, "r_y1": 463.5907, "r_x2": 480.58746, "r_y2": 454.7937299999999, "r_x3": 240.71599, "r_y3": 454.7937299999999, "coord_origin": "TOPLEFT" }, "text": ": Only \"U\" cells and \"C\" cells are allowed in the first", "orig": ": Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 475.54568, "r_x1": 186.0072, "r_y1": 475.54568, "r_x2": 186.0072, "r_y2": 466.74872, "r_x3": 151.70099, "r_y3": 466.74872, "coord_origin": "TOPLEFT" }, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 487.50369, "r_x1": 146.71991, "r_y1": 487.50369, "r_x2": 146.71991, "r_y2": 478.70673, "r_x3": 138.97299, "r_y3": 478.70673, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 487.50369, "r_x1": 235.15768, "r_y1": 487.50369, "r_x2": 235.15768, "r_y2": 478.69675, "r_x3": 151.70099, "r_y3": 478.69675, "coord_origin": "TOPLEFT" }, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.15697999999998, "r_y0": 487.50369, "r_x1": 480.59457, "r_y1": 487.50369, "r_x2": 480.59457, "r_y2": 478.70673, "r_x3": 235.15697999999998, "r_y3": 478.70673, "coord_origin": "TOPLEFT" }, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 499.45969, "r_x1": 448.04147, "r_y1": 499.45969, "r_x2": 448.04147, "r_y2": 490.66272, "r_x3": 151.70099, "r_y3": 490.66272, "coord_origin": "TOPLEFT" }, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 521.38968, "r_x1": 480.59583, "r_y1": 521.38968, "r_x2": 480.59583, "r_y2": 512.59271, "r_x3": 149.70898, "r_y3": 512.59271, "coord_origin": "TOPLEFT" }, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 533.34467, "r_x1": 480.59079, "r_y1": 533.34467, "r_x2": 480.59079, "r_y2": 524.5477000000001, "r_x3": 134.76498, "r_y3": 524.5477000000001, "coord_origin": "TOPLEFT" }, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 545.29967, "r_x1": 480.59482, "r_y1": 545.29967, "r_x2": 480.59482, "r_y2": 536.5027, "r_x3": 134.76498, "r_y3": 536.5027, "coord_origin": "TOPLEFT" }, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 557.25566, "r_x1": 480.58865000000003, "r_y1": 557.25566, "r_x2": 480.58865000000003, "r_y2": 548.4586899999999, "r_x3": 134.76498, "r_y3": 548.4586899999999, "coord_origin": "TOPLEFT" }, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 569.21066, "r_x1": 480.59365999999994, "r_y1": 569.21066, "r_x2": 480.59365999999994, "r_y2": 560.4137000000001, "r_x3": 134.76498, "r_y3": 560.4137000000001, "coord_origin": "TOPLEFT" }, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 581.16566, "r_x1": 480.58673, "r_y1": 581.16566, "r_x2": 480.58673, "r_y2": 572.3687, "r_x3": 134.76498, "r_y3": 572.3687, "coord_origin": "TOPLEFT" }, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 593.12067, "r_x1": 480.59171, "r_y1": 593.12067, "r_x2": 480.59171, "r_y2": 584.3237, "r_x3": 134.76498, "r_y3": 584.3237, "coord_origin": "TOPLEFT" }, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 605.07567, "r_x1": 480.59180000000003, "r_y1": 605.07567, "r_x2": 480.59180000000003, "r_y2": 596.2787, "r_x3": 134.76498, "r_y3": 596.2787, "coord_origin": "TOPLEFT" }, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 617.03166, "r_x1": 480.5936899999999, "r_y1": 617.03166, "r_x2": 480.5936899999999, "r_y2": 608.2347, "r_x3": 134.76498, "r_y3": 608.2347, "coord_origin": "TOPLEFT" }, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 628.98666, "r_x1": 480.59072999999995, "r_y1": 628.98666, "r_x2": 480.59072999999995, "r_y2": 620.1897, "r_x3": 134.76498, "r_y3": 620.1897, "coord_origin": "TOPLEFT" }, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 640.9416699999999, "r_x1": 311.19769, "r_y1": 640.9416699999999, "r_x2": 311.19769, "r_y2": 632.1447000000001, "r_x3": 134.76498, "r_y3": 632.1447000000001, "coord_origin": "TOPLEFT" }, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 652.89966, "r_x1": 480.59186, "r_y1": 652.89966, "r_x2": 480.59186, "r_y2": 644.1026899999999, "r_x3": 149.70898, "r_y3": 644.1026899999999, "coord_origin": "TOPLEFT" }, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 664.8546699999999, "r_x1": 480.59265, "r_y1": 664.8546699999999, "r_x2": 480.59265, "r_y2": 656.05769, "r_x3": 134.76498, "r_y3": 656.05769, "coord_origin": "TOPLEFT" }, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 7, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.932651162147522, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "page_header", "bbox": { "l": 475.98431, "t": 93.77099999999996, "r": 480.59125000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8749732375144958, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "caption", "bbox": { "l": 134.765, "t": 125.79918999999984, "r": 480.5874, "b": 155.84966999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9333080053329468, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 133.72551999999996, "r_x1": 162.64424, "r_y1": 133.72551999999996, "r_x2": 162.64424, "r_y2": 125.79918999999984, "r_x3": 134.765, "r_y3": 125.79918999999984, "coord_origin": "TOPLEFT" }, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.276, "r_y0": 133.93169999999998, "r_x1": 480.58675999999997, "r_y1": 133.93169999999998, "r_x2": 480.58675999999997, "r_y2": 125.86200000000008, "r_x3": 166.276, "r_y3": 125.86200000000008, "coord_origin": "TOPLEFT" }, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 144.89068999999995, "r_x1": 480.5874, "r_y1": 144.89068999999995, "r_x2": 480.5874, "r_y2": 136.82097999999996, "r_x3": 134.765, "r_y3": 136.82097999999996, "coord_origin": "TOPLEFT" }, "text": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "orig": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 155.84966999999995, "r_x1": 306.1156, "r_y1": 155.84966999999995, "r_x2": 306.1156, "r_y2": 147.77997000000005, "r_x3": 134.765, "r_y3": 147.77997000000005, "coord_origin": "TOPLEFT" }, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "picture", "bbox": { "l": 164.65028381347656, "t": 163.79708862304688, "r": 449.5505676269531, "b": 280.3409423828125, "coord_origin": "TOPLEFT" }, "confidence": 0.7868534922599792, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49326, "r_y0": 177.91540999999995, "r_x1": 381.66843, "r_y1": 177.91540999999995, "r_x2": 381.66843, "r_y2": 168.59362999999996, "r_x3": 374.49326, "r_y3": 168.59362999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74011, "r_y0": 177.82183999999995, "r_x1": 405.91528, "r_y1": 177.82183999999995, "r_x2": 405.91528, "r_y2": 168.50005999999996, "r_x3": 398.74011, "r_y3": 168.50005999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.76862, "r_y0": 202.24730999999997, "r_x1": 380.94379, "r_y1": 202.24730999999997, "r_x2": 380.94379, "r_y2": 192.92553999999996, "r_x3": 373.76862, "r_y3": 192.92553999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66388, "r_y0": 202.39239999999995, "r_x1": 393.83905, "r_y1": 202.39239999999995, "r_x2": 393.83905, "r_y2": 193.07061999999996, "r_x3": 386.66388, "r_y3": 193.07061999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.68707, "r_y0": 214.45934999999997, "r_x1": 393.86224, "r_y1": 214.45934999999997, "r_x2": 393.86224, "r_y2": 205.13756999999998, "r_x3": 386.68707, "r_y3": 205.13756999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.65729, "r_y0": 190.05457, "r_x1": 405.83246, "r_y1": 190.05457, "r_x2": 405.83246, "r_y2": 180.73279000000002, "r_x3": 398.65729, "r_y3": 180.73279000000002, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.77908, "r_y0": 190.06035999999995, "r_x1": 417.95425, "r_y1": 190.06035999999995, "r_x2": 417.95425, "r_y2": 180.73859000000004, "r_x3": 410.77908, "r_y3": 180.73859000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.90503, "r_y0": 189.97424, "r_x1": 430.08020000000005, "r_y1": 189.97424, "r_x2": 430.08020000000005, "r_y2": 180.65247, "r_x3": 422.90503, "r_y3": 180.65247, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7807, "r_y0": 202.31042000000002, "r_x1": 405.95587, "r_y1": 202.31042000000002, "r_x2": 405.95587, "r_y2": 192.98865, "r_x3": 398.7807, "r_y3": 192.98865, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90164, "r_y0": 202.31664999999998, "r_x1": 418.07681, "r_y1": 202.31664999999998, "r_x2": 418.07681, "r_y2": 192.99487, "r_x3": 410.90164, "r_y3": 192.99487, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.02753, "r_y0": 202.23077, "r_x1": 430.2027, "r_y1": 202.23077, "r_x2": 430.2027, "r_y2": 192.909, "r_x3": 423.02753, "r_y3": 192.909, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78235, "r_y0": 214.63751000000002, "r_x1": 405.95752, "r_y1": 214.63751000000002, "r_x2": 405.95752, "r_y2": 205.31573000000003, "r_x3": 398.78235, "r_y3": 205.31573000000003, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90414, "r_y0": 214.64373999999998, "r_x1": 418.07932, "r_y1": 214.64373999999998, "r_x2": 418.07932, "r_y2": 205.32196, "r_x3": 410.90414, "r_y3": 205.32196, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03003, "r_y0": 214.55791999999997, "r_x1": 430.20520000000005, "r_y1": 214.55791999999997, "r_x2": 430.20520000000005, "r_y2": 205.23614999999995, "r_x3": 423.03003, "r_y3": 205.23614999999995, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.50574, "r_y0": 226.36059999999998, "r_x1": 393.68091, "r_y1": 226.36059999999998, "r_x2": 393.68091, "r_y2": 217.03882, "r_x3": 386.50574, "r_y3": 217.03882, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.60181, "r_y0": 226.53882, "r_x1": 405.77698, "r_y1": 226.53882, "r_x2": 405.77698, "r_y2": 217.21704, "r_x3": 398.60181, "r_y3": 217.21704, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72275, "r_y0": 226.54498, "r_x1": 417.89792, "r_y1": 226.54498, "r_x2": 417.89792, "r_y2": 217.22321, "r_x3": 410.72275, "r_y3": 217.22321, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.84869, "r_y0": 226.45916999999997, "r_x1": 430.02386, "r_y1": 226.45916999999997, "r_x2": 430.02386, "r_y2": 217.13738999999998, "r_x3": 422.84869, "r_y3": 217.13738999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16009999999994, "r_y0": 177.01189999999997, "r_x1": 447.86273, "r_y1": 177.01189999999997, "r_x2": 447.86273, "r_y2": 167.69011999999998, "r_x3": 435.16009999999994, "r_y3": 167.69011999999998, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44415, "r_y0": 189.52202999999997, "r_x1": 448.14679, "r_y1": 189.52202999999997, "r_x2": 448.14679, "r_y2": 180.20025999999996, "r_x3": 435.44415, "r_y3": 180.20025999999996, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.46735, "r_y0": 201.81652999999994, "r_x1": 448.16998000000007, "r_y1": 201.81652999999994, "r_x2": 448.16998000000007, "r_y2": 192.49474999999995, "r_x3": 435.46735, "r_y3": 192.49474999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38202, "r_y0": 214.15204000000006, "r_x1": 448.08466, "r_y1": 214.15204000000006, "r_x2": 448.08466, "r_y2": 204.83025999999995, "r_x3": 435.38202, "r_y3": 204.83025999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.59906, "r_y0": 226.55548, "r_x1": 448.3017, "r_y1": 226.55548, "r_x2": 448.3017, "r_y2": 217.2337, "r_x3": 435.59906, "r_y3": 217.2337, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.14957, "r_y0": 214.55669999999998, "r_x1": 381.32474, "r_y1": 214.55669999999998, "r_x2": 381.32474, "r_y2": 205.23492, "r_x3": 374.14957, "r_y3": 205.23492, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0419, "r_y0": 226.46826, "r_x1": 381.21707, "r_y1": 226.46826, "r_x2": 381.21707, "r_y2": 217.14648, "r_x3": 374.0419, "r_y3": 217.14648, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34418, "r_y0": 190.25665000000004, "r_x1": 381.51935, "r_y1": 190.25665000000004, "r_x2": 381.51935, "r_y2": 180.93488000000002, "r_x3": 374.34418, "r_y3": 180.93488000000002, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76285, "r_y0": 177.89966000000004, "r_x1": 393.28833, "r_y1": 177.89966000000004, "r_x2": 393.28833, "r_y2": 168.57788000000005, "r_x3": 387.76285, "r_y3": 168.57788000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86395, "r_y0": 177.38373, "r_x1": 417.38943, "r_y1": 177.38373, "r_x2": 417.38943, "r_y2": 168.06195000000002, "r_x3": 411.86395, "r_y3": 168.06195000000002, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.33563, "r_y0": 177.25616000000002, "r_x1": 428.86111, "r_y1": 177.25616000000002, "r_x2": 428.86111, "r_y2": 167.93439, "r_x3": 423.33563, "r_y3": 167.93439, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.13593, "r_y0": 190.10753999999997, "r_x1": 393.76453, "r_y1": 190.10753999999997, "r_x2": 393.76453, "r_y2": 180.78576999999996, "r_x3": 387.13593, "r_y3": 180.78576999999996, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.2594, "r_y0": 253.83056999999997, "r_x1": 289.43457, "r_y1": 253.83056999999997, "r_x2": 289.43457, "r_y2": 244.50878999999998, "r_x3": 282.2594, "r_y3": 244.50878999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11035, "r_y0": 266.172, "r_x1": 289.28552, "r_y1": 266.172, "r_x2": 289.28552, "r_y2": 256.85022000000004, "r_x3": 282.11035, "r_y3": 256.85022000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.40848, "r_y0": 278.45477000000005, "r_x1": 289.58365, "r_y1": 278.45477000000005, "r_x2": 289.58365, "r_y2": 269.13300000000004, "r_x3": 282.40848, "r_y3": 269.13300000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.52902, "r_y0": 253.81525, "r_x1": 301.0545, "r_y1": 253.81525, "r_x2": 301.0545, "r_y2": 244.49347, "r_x3": 295.52902, "r_y3": 244.49347, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.46613, "r_y0": 253.89550999999994, "r_x1": 312.99161, "r_y1": 253.89550999999994, "r_x2": 312.99161, "r_y2": 244.57372999999995, "r_x3": 307.46613, "r_y3": 244.57372999999995, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.76886, "r_y0": 253.76215000000002, "r_x1": 324.29434, "r_y1": 253.76215000000002, "r_x2": 324.29434, "r_y2": 244.44037000000003, "r_x3": 318.76886, "r_y3": 244.44037000000003, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9021, "r_y0": 266.02332, "r_x1": 301.03976, "r_y1": 266.02332, "r_x2": 301.03976, "r_y2": 256.70154, "r_x3": 294.9021, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.17743, "r_y0": 266.02332, "r_x1": 325.59039, "r_y1": 266.02332, "r_x2": 325.59039, "r_y2": 256.70154, "r_x3": 307.17743, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.78949, "r_y0": 278.57599000000005, "r_x1": 300.92715, "r_y1": 278.57599000000005, "r_x2": 300.92715, "r_y2": 269.25420999999994, "r_x3": 294.78949, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06482, "r_y0": 278.57599000000005, "r_x1": 325.47778, "r_y1": 278.57599000000005, "r_x2": 325.47778, "r_y2": 269.25420999999994, "r_x3": 307.06482, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.93939, "r_y0": 278.06976, "r_x1": 203.11456, "r_y1": 278.06976, "r_x2": 203.11456, "r_y2": 268.74798999999996, "r_x3": 195.93939, "r_y3": 268.74798999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.20891, "r_y0": 278.05444, "r_x1": 214.73439, "r_y1": 278.05444, "r_x2": 214.73439, "r_y2": 268.73267, "r_x3": 209.20891, "r_y3": 268.73267, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.14551, "r_y0": 278.13469999999995, "r_x1": 226.67099, "r_y1": 278.13469999999995, "r_x2": 226.67099, "r_y2": 268.81293000000005, "r_x3": 221.14551, "r_y3": 268.81293000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.44858, "r_y0": 278.00134, "r_x1": 237.97405999999998, "r_y1": 278.00134, "r_x2": 237.97405999999998, "r_y2": 268.67957, "r_x3": 232.44858, "r_y3": 268.67957, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.21715, "r_y0": 253.86139000000003, "r_x1": 203.39232, "r_y1": 253.86139000000003, "r_x2": 203.39232, "r_y2": 244.53961000000004, "r_x3": 196.21715, "r_y3": 244.53961000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32143, "r_y0": 253.41992000000005, "r_x1": 257.49661, "r_y1": 253.41992000000005, "r_x2": 257.49661, "r_y2": 244.09813999999994, "r_x3": 250.32143, "r_y3": 244.09813999999994, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17235999999997, "r_y0": 265.76129000000003, "r_x1": 257.34753, "r_y1": 265.76129000000003, "r_x2": 257.34753, "r_y2": 256.43951000000004, "r_x3": 250.17235999999997, "r_y3": 256.43951000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47049000000004, "r_y0": 278.04400999999996, "r_x1": 257.64566, "r_y1": 278.04400999999996, "r_x2": 257.64566, "r_y2": 268.72222999999997, "r_x3": 250.47049000000004, "r_y3": 268.72222999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 249.20911, "r_x1": 337.22485, "r_y1": 249.20911, "r_x2": 337.22485, "r_y2": 242.99463000000003, "r_x3": 334.51135, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.93835, "r_y0": 249.20911, "r_x1": 391.49472, "r_y1": 249.20911, "r_x2": 391.49472, "r_y2": 242.99463000000003, "r_x3": 339.93835, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 259.14703, "r_x1": 337.33313, "r_y1": 259.14703, "r_x2": 337.33313, "r_y2": 252.93255999999997, "r_x3": 334.51135, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15491, "r_y0": 259.14703, "r_x1": 421.98624, "r_y1": 259.14703, "r_x2": 421.98624, "r_y2": 252.93255999999997, "r_x3": 340.15491, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 269.08496, "r_x1": 337.29868, "r_y1": 269.08496, "r_x2": 337.29868, "r_y2": 262.87048000000004, "r_x3": 334.51135, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.086, "r_y0": 269.08496, "r_x1": 415.34375, "r_y1": 269.08496, "r_x2": 415.34375, "r_y2": 262.87048000000004, "r_x3": 340.086, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 279.02288999999996, "r_x1": 337.30188, "r_y1": 279.02288999999996, "r_x2": 337.30188, "r_y2": 272.80841, "r_x3": 334.51135, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09241, "r_y0": 279.02288999999996, "r_x1": 426.59875, "r_y1": 279.02288999999996, "r_x2": 426.59875, "r_y2": 272.80841, "r_x3": 340.09241, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67178, "r_y0": 250.25671, "r_x1": 189.35544, "r_y1": 250.25671, "r_x2": 189.35544, "r_y2": 244.04224, "r_x3": 185.67178, "r_y3": 244.04224, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.96759, "r_y0": 274.56213, "r_x1": 189.65125, "r_y1": 274.56213, "r_x2": 189.65125, "r_y2": 268.34766, "r_x3": 185.96759, "r_y3": 268.34766, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34152, "r_y0": 249.83972000000006, "r_x1": 243.02518, "r_y1": 249.83972000000006, "r_x2": 243.02518, "r_y2": 243.62523999999996, "r_x3": 239.34152, "r_y3": 243.62523999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.32852, "r_y0": 249.70836999999995, "r_x1": 275.01218, "r_y1": 249.70836999999995, "r_x2": 275.01218, "r_y2": 243.49390000000005, "r_x3": 271.32852, "r_y3": 243.49390000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.81627, "r_y0": 172.72942999999998, "r_x1": 233.49992000000003, "r_y1": 172.72942999999998, "r_x2": 233.49992000000003, "r_y2": 166.51495, "r_x3": 229.81627, "r_y3": 166.51495, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24402, "r_y0": 196.17548, "r_x1": 260.92767, "r_y1": 196.17548, "r_x2": 260.92767, "r_y2": 189.961, "r_x3": 257.24402, "r_y3": 189.961, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.87526, "r_y0": 184.19115999999997, "r_x1": 190.55891, "r_y1": 184.19115999999997, "r_x2": 190.55891, "r_y2": 177.97668, "r_x3": 186.87526, "r_y3": 177.97668, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.48746, "r_y0": 175.22968000000003, "r_x1": 200.17111, "r_y1": 175.22968000000003, "r_x2": 200.17111, "r_y2": 169.01520000000005, "r_x3": 196.48746, "r_y3": 169.01520000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 175.65039000000002, "r_x1": 175.72659, "r_y1": 175.65039000000002, "r_x2": 175.72659, "r_y2": 167.88225999999997, "r_x3": 169.74728, "r_y3": 167.88225999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 214.60681, "r_x1": 175.72659, "r_y1": 214.60681, "r_x2": 175.72659, "r_y2": 206.83867999999995, "r_x3": 169.74728, "r_y3": 206.83867999999995, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29419, "r_y0": 176.04785000000004, "r_x1": 280.2735, "r_y1": 176.04785000000004, "r_x2": 280.2735, "r_y2": 168.27972, "r_x3": 274.29419, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56152, "r_y0": 176.04785000000004, "r_x1": 365.54083, "r_y1": 176.04785000000004, "r_x2": 365.54083, "r_y2": 168.27972, "r_x3": 359.56152, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 250.97960999999998, "r_x1": 175.27112, "r_y1": 250.97960999999998, "r_x2": 175.27112, "r_y2": 243.21149000000003, "r_x3": 169.74728, "r_y3": 243.21149000000003, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 38, "label": "text", "bbox": { "l": 374.49326, "t": 168.59362999999996, "r": 381.66843, "b": 177.91540999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49326, "r_y0": 177.91540999999995, "r_x1": 381.66843, "r_y1": 177.91540999999995, "r_x2": 381.66843, "r_y2": 168.59362999999996, "r_x3": 374.49326, "r_y3": 168.59362999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 398.74011, "t": 168.50005999999996, "r": 405.91528, "b": 177.82183999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74011, "r_y0": 177.82183999999995, "r_x1": 405.91528, "r_y1": 177.82183999999995, "r_x2": 405.91528, "r_y2": 168.50005999999996, "r_x3": 398.74011, "r_y3": 168.50005999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 373.76862, "t": 192.92553999999996, "r": 380.94379, "b": 202.24730999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.76862, "r_y0": 202.24730999999997, "r_x1": 380.94379, "r_y1": 202.24730999999997, "r_x2": 380.94379, "r_y2": 192.92553999999996, "r_x3": 373.76862, "r_y3": 192.92553999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 386.66388, "t": 193.07061999999996, "r": 393.83905, "b": 202.39239999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66388, "r_y0": 202.39239999999995, "r_x1": 393.83905, "r_y1": 202.39239999999995, "r_x2": 393.83905, "r_y2": 193.07061999999996, "r_x3": 386.66388, "r_y3": 193.07061999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 386.68707, "t": 205.13756999999998, "r": 393.86224, "b": 214.45934999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.68707, "r_y0": 214.45934999999997, "r_x1": 393.86224, "r_y1": 214.45934999999997, "r_x2": 393.86224, "r_y2": 205.13756999999998, "r_x3": 386.68707, "r_y3": 205.13756999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 398.65729, "t": 180.73279000000002, "r": 405.83246, "b": 190.05457, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.65729, "r_y0": 190.05457, "r_x1": 405.83246, "r_y1": 190.05457, "r_x2": 405.83246, "r_y2": 180.73279000000002, "r_x3": 398.65729, "r_y3": 180.73279000000002, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 410.77908, "t": 180.73859000000004, "r": 417.95425, "b": 190.06035999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.77908, "r_y0": 190.06035999999995, "r_x1": 417.95425, "r_y1": 190.06035999999995, "r_x2": 417.95425, "r_y2": 180.73859000000004, "r_x3": 410.77908, "r_y3": 180.73859000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 422.90503, "t": 180.65247, "r": 430.08020000000005, "b": 189.97424, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.90503, "r_y0": 189.97424, "r_x1": 430.08020000000005, "r_y1": 189.97424, "r_x2": 430.08020000000005, "r_y2": 180.65247, "r_x3": 422.90503, "r_y3": 180.65247, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 398.7807, "t": 192.98865, "r": 405.95587, "b": 202.31042000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7807, "r_y0": 202.31042000000002, "r_x1": 405.95587, "r_y1": 202.31042000000002, "r_x2": 405.95587, "r_y2": 192.98865, "r_x3": 398.7807, "r_y3": 192.98865, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 410.90164, "t": 192.99487, "r": 418.07681, "b": 202.31664999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90164, "r_y0": 202.31664999999998, "r_x1": 418.07681, "r_y1": 202.31664999999998, "r_x2": 418.07681, "r_y2": 192.99487, "r_x3": 410.90164, "r_y3": 192.99487, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 423.02753, "t": 192.909, "r": 430.2027, "b": 202.23077, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.02753, "r_y0": 202.23077, "r_x1": 430.2027, "r_y1": 202.23077, "r_x2": 430.2027, "r_y2": 192.909, "r_x3": 423.02753, "r_y3": 192.909, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 398.78235, "t": 205.31573000000003, "r": 405.95752, "b": 214.63751000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78235, "r_y0": 214.63751000000002, "r_x1": 405.95752, "r_y1": 214.63751000000002, "r_x2": 405.95752, "r_y2": 205.31573000000003, "r_x3": 398.78235, "r_y3": 205.31573000000003, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 410.90414, "t": 205.32196, "r": 418.07932, "b": 214.64373999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90414, "r_y0": 214.64373999999998, "r_x1": 418.07932, "r_y1": 214.64373999999998, "r_x2": 418.07932, "r_y2": 205.32196, "r_x3": 410.90414, "r_y3": 205.32196, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 423.03003, "t": 205.23614999999995, "r": 430.20520000000005, "b": 214.55791999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03003, "r_y0": 214.55791999999997, "r_x1": 430.20520000000005, "r_y1": 214.55791999999997, "r_x2": 430.20520000000005, "r_y2": 205.23614999999995, "r_x3": 423.03003, "r_y3": 205.23614999999995, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 386.50574, "t": 217.03882, "r": 393.68091, "b": 226.36059999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.50574, "r_y0": 226.36059999999998, "r_x1": 393.68091, "r_y1": 226.36059999999998, "r_x2": 393.68091, "r_y2": 217.03882, "r_x3": 386.50574, "r_y3": 217.03882, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 398.60181, "t": 217.21704, "r": 405.77698, "b": 226.53882, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.60181, "r_y0": 226.53882, "r_x1": 405.77698, "r_y1": 226.53882, "r_x2": 405.77698, "r_y2": 217.21704, "r_x3": 398.60181, "r_y3": 217.21704, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 410.72275, "t": 217.22321, "r": 417.89792, "b": 226.54498, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72275, "r_y0": 226.54498, "r_x1": 417.89792, "r_y1": 226.54498, "r_x2": 417.89792, "r_y2": 217.22321, "r_x3": 410.72275, "r_y3": 217.22321, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 422.84869, "t": 217.13738999999998, "r": 430.02386, "b": 226.45916999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.84869, "r_y0": 226.45916999999997, "r_x1": 430.02386, "r_y1": 226.45916999999997, "r_x2": 430.02386, "r_y2": 217.13738999999998, "r_x3": 422.84869, "r_y3": 217.13738999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 435.16009999999994, "t": 167.69011999999998, "r": 447.86273, "b": 177.01189999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16009999999994, "r_y0": 177.01189999999997, "r_x1": 447.86273, "r_y1": 177.01189999999997, "r_x2": 447.86273, "r_y2": 167.69011999999998, "r_x3": 435.16009999999994, "r_y3": 167.69011999999998, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 435.44415, "t": 180.20025999999996, "r": 448.14679, "b": 189.52202999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44415, "r_y0": 189.52202999999997, "r_x1": 448.14679, "r_y1": 189.52202999999997, "r_x2": 448.14679, "r_y2": 180.20025999999996, "r_x3": 435.44415, "r_y3": 180.20025999999996, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 435.46735, "t": 192.49474999999995, "r": 448.16998000000007, "b": 201.81652999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.46735, "r_y0": 201.81652999999994, "r_x1": 448.16998000000007, "r_y1": 201.81652999999994, "r_x2": 448.16998000000007, "r_y2": 192.49474999999995, "r_x3": 435.46735, "r_y3": 192.49474999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 435.38202, "t": 204.83025999999995, "r": 448.08466, "b": 214.15204000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38202, "r_y0": 214.15204000000006, "r_x1": 448.08466, "r_y1": 214.15204000000006, "r_x2": 448.08466, "r_y2": 204.83025999999995, "r_x3": 435.38202, "r_y3": 204.83025999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 435.59906, "t": 217.2337, "r": 448.3017, "b": 226.55548, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.59906, "r_y0": 226.55548, "r_x1": 448.3017, "r_y1": 226.55548, "r_x2": 448.3017, "r_y2": 217.2337, "r_x3": 435.59906, "r_y3": 217.2337, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 374.14957, "t": 205.23492, "r": 381.32474, "b": 214.55669999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.14957, "r_y0": 214.55669999999998, "r_x1": 381.32474, "r_y1": 214.55669999999998, "r_x2": 381.32474, "r_y2": 205.23492, "r_x3": 374.14957, "r_y3": 205.23492, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 374.0419, "t": 217.14648, "r": 381.21707, "b": 226.46826, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0419, "r_y0": 226.46826, "r_x1": 381.21707, "r_y1": 226.46826, "r_x2": 381.21707, "r_y2": 217.14648, "r_x3": 374.0419, "r_y3": 217.14648, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 374.34418, "t": 180.93488000000002, "r": 381.51935, "b": 190.25665000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34418, "r_y0": 190.25665000000004, "r_x1": 381.51935, "r_y1": 190.25665000000004, "r_x2": 381.51935, "r_y2": 180.93488000000002, "r_x3": 374.34418, "r_y3": 180.93488000000002, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 387.76285, "t": 168.57788000000005, "r": 393.28833, "b": 177.89966000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76285, "r_y0": 177.89966000000004, "r_x1": 393.28833, "r_y1": 177.89966000000004, "r_x2": 393.28833, "r_y2": 168.57788000000005, "r_x3": 387.76285, "r_y3": 168.57788000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 411.86395, "t": 168.06195000000002, "r": 417.38943, "b": 177.38373, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86395, "r_y0": 177.38373, "r_x1": 417.38943, "r_y1": 177.38373, "r_x2": 417.38943, "r_y2": 168.06195000000002, "r_x3": 411.86395, "r_y3": 168.06195000000002, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 423.33563, "t": 167.93439, "r": 428.86111, "b": 177.25616000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.33563, "r_y0": 177.25616000000002, "r_x1": 428.86111, "r_y1": 177.25616000000002, "r_x2": 428.86111, "r_y2": 167.93439, "r_x3": 423.33563, "r_y3": 167.93439, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 387.13593, "t": 180.78576999999996, "r": 393.76453, "b": 190.10753999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.13593, "r_y0": 190.10753999999997, "r_x1": 393.76453, "r_y1": 190.10753999999997, "r_x2": 393.76453, "r_y2": 180.78576999999996, "r_x3": 387.13593, "r_y3": 180.78576999999996, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 282.2594, "t": 244.50878999999998, "r": 289.43457, "b": 253.83056999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.2594, "r_y0": 253.83056999999997, "r_x1": 289.43457, "r_y1": 253.83056999999997, "r_x2": 289.43457, "r_y2": 244.50878999999998, "r_x3": 282.2594, "r_y3": 244.50878999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 282.11035, "t": 256.85022000000004, "r": 289.28552, "b": 266.172, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11035, "r_y0": 266.172, "r_x1": 289.28552, "r_y1": 266.172, "r_x2": 289.28552, "r_y2": 256.85022000000004, "r_x3": 282.11035, "r_y3": 256.85022000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 282.40848, "t": 269.13300000000004, "r": 289.58365, "b": 278.45477000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.40848, "r_y0": 278.45477000000005, "r_x1": 289.58365, "r_y1": 278.45477000000005, "r_x2": 289.58365, "r_y2": 269.13300000000004, "r_x3": 282.40848, "r_y3": 269.13300000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 295.52902, "t": 244.49347, "r": 301.0545, "b": 253.81525, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.52902, "r_y0": 253.81525, "r_x1": 301.0545, "r_y1": 253.81525, "r_x2": 301.0545, "r_y2": 244.49347, "r_x3": 295.52902, "r_y3": 244.49347, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 307.46613, "t": 244.57372999999995, "r": 312.99161, "b": 253.89550999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.46613, "r_y0": 253.89550999999994, "r_x1": 312.99161, "r_y1": 253.89550999999994, "r_x2": 312.99161, "r_y2": 244.57372999999995, "r_x3": 307.46613, "r_y3": 244.57372999999995, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 318.76886, "t": 244.44037000000003, "r": 324.29434, "b": 253.76215000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.76886, "r_y0": 253.76215000000002, "r_x1": 324.29434, "r_y1": 253.76215000000002, "r_x2": 324.29434, "r_y2": 244.44037000000003, "r_x3": 318.76886, "r_y3": 244.44037000000003, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 294.9021, "t": 256.70154, "r": 301.03976, "b": 266.02332, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9021, "r_y0": 266.02332, "r_x1": 301.03976, "r_y1": 266.02332, "r_x2": 301.03976, "r_y2": 256.70154, "r_x3": 294.9021, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 307.17743, "t": 256.70154, "r": 325.59039, "b": 266.02332, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.17743, "r_y0": 266.02332, "r_x1": 325.59039, "r_y1": 266.02332, "r_x2": 325.59039, "r_y2": 256.70154, "r_x3": 307.17743, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 294.78949, "t": 269.25420999999994, "r": 300.92715, "b": 278.57599000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.78949, "r_y0": 278.57599000000005, "r_x1": 300.92715, "r_y1": 278.57599000000005, "r_x2": 300.92715, "r_y2": 269.25420999999994, "r_x3": 294.78949, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 307.06482, "t": 269.25420999999994, "r": 325.47778, "b": 278.57599000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06482, "r_y0": 278.57599000000005, "r_x1": 325.47778, "r_y1": 278.57599000000005, "r_x2": 325.47778, "r_y2": 269.25420999999994, "r_x3": 307.06482, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 195.93939, "t": 268.74798999999996, "r": 203.11456, "b": 278.06976, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.93939, "r_y0": 278.06976, "r_x1": 203.11456, "r_y1": 278.06976, "r_x2": 203.11456, "r_y2": 268.74798999999996, "r_x3": 195.93939, "r_y3": 268.74798999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 209.20891, "t": 268.73267, "r": 214.73439, "b": 278.05444, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.20891, "r_y0": 278.05444, "r_x1": 214.73439, "r_y1": 278.05444, "r_x2": 214.73439, "r_y2": 268.73267, "r_x3": 209.20891, "r_y3": 268.73267, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 221.14551, "t": 268.81293000000005, "r": 226.67099, "b": 278.13469999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.14551, "r_y0": 278.13469999999995, "r_x1": 226.67099, "r_y1": 278.13469999999995, "r_x2": 226.67099, "r_y2": 268.81293000000005, "r_x3": 221.14551, "r_y3": 268.81293000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.44858, "t": 268.67957, "r": 237.97405999999998, "b": 278.00134, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.44858, "r_y0": 278.00134, "r_x1": 237.97405999999998, "r_y1": 278.00134, "r_x2": 237.97405999999998, "r_y2": 268.67957, "r_x3": 232.44858, "r_y3": 268.67957, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 196.21715, "t": 244.53961000000004, "r": 203.39232, "b": 253.86139000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.21715, "r_y0": 253.86139000000003, "r_x1": 203.39232, "r_y1": 253.86139000000003, "r_x2": 203.39232, "r_y2": 244.53961000000004, "r_x3": 196.21715, "r_y3": 244.53961000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 250.32143, "t": 244.09813999999994, "r": 257.49661, "b": 253.41992000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32143, "r_y0": 253.41992000000005, "r_x1": 257.49661, "r_y1": 253.41992000000005, "r_x2": 257.49661, "r_y2": 244.09813999999994, "r_x3": 250.32143, "r_y3": 244.09813999999994, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 250.17235999999997, "t": 256.43951000000004, "r": 257.34753, "b": 265.76129000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17235999999997, "r_y0": 265.76129000000003, "r_x1": 257.34753, "r_y1": 265.76129000000003, "r_x2": 257.34753, "r_y2": 256.43951000000004, "r_x3": 250.17235999999997, "r_y3": 256.43951000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 250.47049000000004, "t": 268.72222999999997, "r": 257.64566, "b": 278.04400999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47049000000004, "r_y0": 278.04400999999996, "r_x1": 257.64566, "r_y1": 278.04400999999996, "r_x2": 257.64566, "r_y2": 268.72222999999997, "r_x3": 250.47049000000004, "r_y3": 268.72222999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 334.51135, "t": 242.99463000000003, "r": 337.22485, "b": 249.20911, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 249.20911, "r_x1": 337.22485, "r_y1": 249.20911, "r_x2": 337.22485, "r_y2": 242.99463000000003, "r_x3": 334.51135, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 339.93835, "t": 242.99463000000003, "r": 391.49472, "b": 249.20911, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.93835, "r_y0": 249.20911, "r_x1": 391.49472, "r_y1": 249.20911, "r_x2": 391.49472, "r_y2": 242.99463000000003, "r_x3": 339.93835, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 334.51135, "t": 252.93255999999997, "r": 337.33313, "b": 259.14703, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 259.14703, "r_x1": 337.33313, "r_y1": 259.14703, "r_x2": 337.33313, "r_y2": 252.93255999999997, "r_x3": 334.51135, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 340.15491, "t": 252.93255999999997, "r": 421.98624, "b": 259.14703, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15491, "r_y0": 259.14703, "r_x1": 421.98624, "r_y1": 259.14703, "r_x2": 421.98624, "r_y2": 252.93255999999997, "r_x3": 340.15491, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 334.51135, "t": 262.87048000000004, "r": 337.29868, "b": 269.08496, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 269.08496, "r_x1": 337.29868, "r_y1": 269.08496, "r_x2": 337.29868, "r_y2": 262.87048000000004, "r_x3": 334.51135, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 340.086, "t": 262.87048000000004, "r": 415.34375, "b": 269.08496, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.086, "r_y0": 269.08496, "r_x1": 415.34375, "r_y1": 269.08496, "r_x2": 415.34375, "r_y2": 262.87048000000004, "r_x3": 340.086, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 334.51135, "t": 272.80841, "r": 426.59875, "b": 279.02288999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.5250625610351562, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 279.02288999999996, "r_x1": 337.30188, "r_y1": 279.02288999999996, "r_x2": 337.30188, "r_y2": 272.80841, "r_x3": 334.51135, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09241, "r_y0": 279.02288999999996, "r_x1": 426.59875, "r_y1": 279.02288999999996, "r_x2": 426.59875, "r_y2": 272.80841, "r_x3": 340.09241, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 185.67178, "t": 244.04224, "r": 189.35544, "b": 250.25671, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67178, "r_y0": 250.25671, "r_x1": 189.35544, "r_y1": 250.25671, "r_x2": 189.35544, "r_y2": 244.04224, "r_x3": 185.67178, "r_y3": 244.04224, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 185.96759, "t": 268.34766, "r": 189.65125, "b": 274.56213, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.96759, "r_y0": 274.56213, "r_x1": 189.65125, "r_y1": 274.56213, "r_x2": 189.65125, "r_y2": 268.34766, "r_x3": 185.96759, "r_y3": 268.34766, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 239.34152, "t": 243.62523999999996, "r": 243.02518, "b": 249.83972000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34152, "r_y0": 249.83972000000006, "r_x1": 243.02518, "r_y1": 249.83972000000006, "r_x2": 243.02518, "r_y2": 243.62523999999996, "r_x3": 239.34152, "r_y3": 243.62523999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 271.32852, "t": 243.49390000000005, "r": 275.01218, "b": 249.70836999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.32852, "r_y0": 249.70836999999995, "r_x1": 275.01218, "r_y1": 249.70836999999995, "r_x2": 275.01218, "r_y2": 243.49390000000005, "r_x3": 271.32852, "r_y3": 243.49390000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 229.81627, "t": 166.51495, "r": 233.49992000000003, "b": 172.72942999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.81627, "r_y0": 172.72942999999998, "r_x1": 233.49992000000003, "r_y1": 172.72942999999998, "r_x2": 233.49992000000003, "r_y2": 166.51495, "r_x3": 229.81627, "r_y3": 166.51495, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 257.24402, "t": 189.961, "r": 260.92767, "b": 196.17548, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24402, "r_y0": 196.17548, "r_x1": 260.92767, "r_y1": 196.17548, "r_x2": 260.92767, "r_y2": 189.961, "r_x3": 257.24402, "r_y3": 189.961, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 186.87526, "t": 177.97668, "r": 190.55891, "b": 184.19115999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.87526, "r_y0": 184.19115999999997, "r_x1": 190.55891, "r_y1": 184.19115999999997, "r_x2": 190.55891, "r_y2": 177.97668, "r_x3": 186.87526, "r_y3": 177.97668, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 196.48746, "t": 169.01520000000005, "r": 200.17111, "b": 175.22968000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.48746, "r_y0": 175.22968000000003, "r_x1": 200.17111, "r_y1": 175.22968000000003, "r_x2": 200.17111, "r_y2": 169.01520000000005, "r_x3": 196.48746, "r_y3": 169.01520000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 169.74728, "t": 167.88225999999997, "r": 175.72659, "b": 175.65039000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 175.65039000000002, "r_x1": 175.72659, "r_y1": 175.65039000000002, "r_x2": 175.72659, "r_y2": 167.88225999999997, "r_x3": 169.74728, "r_y3": 167.88225999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 169.74728, "t": 206.83867999999995, "r": 175.72659, "b": 214.60681, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 214.60681, "r_x1": 175.72659, "r_y1": 214.60681, "r_x2": 175.72659, "r_y2": 206.83867999999995, "r_x3": 169.74728, "r_y3": 206.83867999999995, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 274.29419, "t": 168.27972, "r": 280.2735, "b": 176.04785000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29419, "r_y0": 176.04785000000004, "r_x1": 280.2735, "r_y1": 176.04785000000004, "r_x2": 280.2735, "r_y2": 168.27972, "r_x3": 274.29419, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 359.56152, "t": 168.27972, "r": 365.54083, "b": 176.04785000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56152, "r_y0": 176.04785000000004, "r_x1": 365.54083, "r_y1": 176.04785000000004, "r_x2": 365.54083, "r_y2": 168.27972, "r_x3": 359.56152, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 169.74728, "t": 243.21149000000003, "r": 175.27112, "b": 250.97960999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 250.97960999999998, "r_x1": 175.27112, "r_y1": 250.97960999999998, "r_x2": 175.27112, "r_y2": 243.21149000000003, "r_x3": 169.74728, "r_y3": 243.21149000000003, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 9, "label": "section_header", "bbox": { "l": 134.765, "t": 305.29581, "r": 246.65197999999998, "b": 314.10275, "coord_origin": "TOPLEFT" }, "confidence": 0.9233023524284363, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 314.10275, "r_x1": 149.40205, "r_y1": 314.10275, "r_x2": 149.40205, "r_y2": 305.29581, "r_x3": 134.765, "r_y3": 305.29581, "coord_origin": "TOPLEFT" }, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 314.10275, "r_x1": 246.65197999999998, "r_y1": 314.10275, "r_x2": 246.65197999999998, "r_y2": 305.29581, "r_x3": 160.85904, "r_y3": 305.29581, "coord_origin": "TOPLEFT" }, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "text", "bbox": { "l": 134.765, "t": 325.24777, "r": 363.79617, "b": 334.04474, "coord_origin": "TOPLEFT" }, "confidence": 0.9169168472290039, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 334.04474, "r_x1": 363.79617, "r_y1": 334.04474, "r_x2": 363.79617, "r_y2": 325.24777, "r_x3": 134.765, "r_y3": 325.24777, "coord_origin": "TOPLEFT" }, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 138.97299, "t": 347.17081, "r": 480.58902, "b": 367.93375, "coord_origin": "TOPLEFT" }, "confidence": 0.9588112235069275, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 355.97775, "r_x1": 146.71991, "r_y1": 355.97775, "r_x2": 146.71991, "r_y2": 347.18079, "r_x3": 138.97299, "r_y3": 347.18079, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 355.97775, "r_x1": 257.37927, "r_y1": 355.97775, "r_x2": 257.37927, "r_y2": 347.17081, "r_x3": 151.70099, "r_y3": 347.17081, "coord_origin": "TOPLEFT" }, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.383, "r_y0": 355.97775, "r_x1": 480.58902, "r_y1": 355.97775, "r_x2": 480.58902, "r_y2": 347.18079, "r_x3": 257.383, "r_y3": 347.18079, "coord_origin": "TOPLEFT" }, "text": ": The left neighbour of an \"L\" cell must be either", "orig": ": The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 367.93375, "r_x1": 283.59387, "r_y1": 367.93375, "r_x2": 283.59387, "r_y2": 359.13678, "r_x3": 151.70099, "r_y3": 359.13678, "coord_origin": "TOPLEFT" }, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 138.97299, "t": 371.08481, "r": 480.59229000000005, "b": 391.84673999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9585386514663696, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 379.89175, "r_x1": 146.71991, "r_y1": 379.89175, "r_x2": 146.71991, "r_y2": 371.09479, "r_x3": 138.97299, "r_y3": 371.09479, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 379.89175, "r_x1": 252.11203, "r_y1": 379.89175, "r_x2": 252.11203, "r_y2": 371.08481, "r_x3": 151.70099, "r_y3": 371.08481, "coord_origin": "TOPLEFT" }, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.112, "r_y0": 379.89175, "r_x1": 480.59229000000005, "r_y1": 379.89175, "r_x2": 480.59229000000005, "r_y2": 371.09479, "r_x3": 252.112, "r_y3": 371.09479, "coord_origin": "TOPLEFT" }, "text": ": The upper neighbour of a \"U\" cell must be either", "orig": ": The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 391.84673999999995, "r_x1": 284.8392, "r_y1": 391.84673999999995, "r_x2": 284.8392, "r_y2": 383.04977, "r_x3": 151.70099, "r_y3": 383.04977, "coord_origin": "TOPLEFT" }, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "section_header", "bbox": { "l": 138.97299, "t": 394.99780000000004, "r": 226.07360999999997, "b": 403.80475, "coord_origin": "TOPLEFT" }, "confidence": 0.6506174206733704, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 403.80475, "r_x1": 146.71991, "r_y1": 403.80475, "r_x2": 146.71991, "r_y2": 395.0077800000001, "r_x3": 138.97299, "r_y3": 395.0077800000001, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 403.80475, "r_x1": 223.3042, "r_y1": 403.80475, "r_x2": 223.3042, "r_y2": 394.99780000000004, "r_x3": 151.70099, "r_y3": 394.99780000000004, "coord_origin": "TOPLEFT" }, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.30699, "r_y0": 403.80475, "r_x1": 226.07360999999997, "r_y1": 403.80475, "r_x2": 226.07360999999997, "r_y2": 395.0077800000001, "r_x3": 223.30699, "r_y3": 395.0077800000001, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "list_item", "bbox": { "l": 151.70099, "t": 406.96677, "r": 480.59238, "b": 439.67371, "coord_origin": "TOPLEFT" }, "confidence": 0.7247239947319031, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 415.76373, "r_x1": 480.59238, "r_y1": 415.76373, "r_x2": 480.59238, "r_y2": 406.96677, "r_x3": 151.70099, "r_y3": 406.96677, "coord_origin": "TOPLEFT" }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 427.71871999999996, "r_x1": 480.59219, "r_y1": 427.71871999999996, "r_x2": 480.59219, "r_y2": 418.9217499999999, "r_x3": 151.70099, "r_y3": 418.9217499999999, "coord_origin": "TOPLEFT" }, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 439.67371, "r_x1": 214.39663999999996, "r_y1": 439.67371, "r_x2": 214.39663999999996, "r_y2": 430.87674, "r_x3": 151.70099, "r_y3": 430.87674, "coord_origin": "TOPLEFT" }, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 138.97299, "t": 442.82574, "r": 474.59018, "b": 451.63269, "coord_origin": "TOPLEFT" }, "confidence": 0.9259927272796631, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 451.63269, "r_x1": 146.71991, "r_y1": 451.63269, "r_x2": 146.71991, "r_y2": 442.83572, "r_x3": 138.97299, "r_y3": 442.83572, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 451.63269, "r_x1": 221.32263, "r_y1": 451.63269, "r_x2": 221.32263, "r_y2": 442.82574, "r_x3": 151.70099, "r_y3": 442.82574, "coord_origin": "TOPLEFT" }, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.32700000000003, "r_y0": 451.63269, "r_x1": 474.59018, "r_y1": 451.63269, "r_x2": 474.59018, "r_y2": 442.83572, "r_x3": 221.32700000000003, "r_y3": 442.83572, "coord_origin": "TOPLEFT" }, "text": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 138.97299, "t": 454.78375, "r": 480.58746, "b": 475.54568, "coord_origin": "TOPLEFT" }, "confidence": 0.9420599937438965, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 463.5907, "r_x1": 146.71991, "r_y1": 463.5907, "r_x2": 146.71991, "r_y2": 454.7937299999999, "r_x3": 138.97299, "r_y3": 454.7937299999999, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 463.5907, "r_x1": 240.71982, "r_y1": 463.5907, "r_x2": 240.71982, "r_y2": 454.78375, "r_x3": 151.70099, "r_y3": 454.78375, "coord_origin": "TOPLEFT" }, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.71599, "r_y0": 463.5907, "r_x1": 480.58746, "r_y1": 463.5907, "r_x2": 480.58746, "r_y2": 454.7937299999999, "r_x3": 240.71599, "r_y3": 454.7937299999999, "coord_origin": "TOPLEFT" }, "text": ": Only \"U\" cells and \"C\" cells are allowed in the first", "orig": ": Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 475.54568, "r_x1": 186.0072, "r_y1": 475.54568, "r_x2": 186.0072, "r_y2": 466.74872, "r_x3": 151.70099, "r_y3": 466.74872, "coord_origin": "TOPLEFT" }, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "list_item", "bbox": { "l": 138.97299, "t": 478.69675, "r": 480.59457, "b": 499.45969, "coord_origin": "TOPLEFT" }, "confidence": 0.9617829918861389, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 487.50369, "r_x1": 146.71991, "r_y1": 487.50369, "r_x2": 146.71991, "r_y2": 478.70673, "r_x3": 138.97299, "r_y3": 478.70673, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 487.50369, "r_x1": 235.15768, "r_y1": 487.50369, "r_x2": 235.15768, "r_y2": 478.69675, "r_x3": 151.70099, "r_y3": 478.69675, "coord_origin": "TOPLEFT" }, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.15697999999998, "r_y0": 487.50369, "r_x1": 480.59457, "r_y1": 487.50369, "r_x2": 480.59457, "r_y2": 478.70673, "r_x3": 235.15697999999998, "r_y3": 478.70673, "coord_origin": "TOPLEFT" }, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 499.45969, "r_x1": 448.04147, "r_y1": 499.45969, "r_x2": 448.04147, "r_y2": 490.66272, "r_x3": 151.70099, "r_y3": 490.66272, "coord_origin": "TOPLEFT" }, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.76498, "t": 512.59271, "r": 480.59583, "b": 640.9416699999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9785562753677368, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 521.38968, "r_x1": 480.59583, "r_y1": 521.38968, "r_x2": 480.59583, "r_y2": 512.59271, "r_x3": 149.70898, "r_y3": 512.59271, "coord_origin": "TOPLEFT" }, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 533.34467, "r_x1": 480.59079, "r_y1": 533.34467, "r_x2": 480.59079, "r_y2": 524.5477000000001, "r_x3": 134.76498, "r_y3": 524.5477000000001, "coord_origin": "TOPLEFT" }, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 545.29967, "r_x1": 480.59482, "r_y1": 545.29967, "r_x2": 480.59482, "r_y2": 536.5027, "r_x3": 134.76498, "r_y3": 536.5027, "coord_origin": "TOPLEFT" }, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 557.25566, "r_x1": 480.58865000000003, "r_y1": 557.25566, "r_x2": 480.58865000000003, "r_y2": 548.4586899999999, "r_x3": 134.76498, "r_y3": 548.4586899999999, "coord_origin": "TOPLEFT" }, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 569.21066, "r_x1": 480.59365999999994, "r_y1": 569.21066, "r_x2": 480.59365999999994, "r_y2": 560.4137000000001, "r_x3": 134.76498, "r_y3": 560.4137000000001, "coord_origin": "TOPLEFT" }, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 581.16566, "r_x1": 480.58673, "r_y1": 581.16566, "r_x2": 480.58673, "r_y2": 572.3687, "r_x3": 134.76498, "r_y3": 572.3687, "coord_origin": "TOPLEFT" }, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 593.12067, "r_x1": 480.59171, "r_y1": 593.12067, "r_x2": 480.59171, "r_y2": 584.3237, "r_x3": 134.76498, "r_y3": 584.3237, "coord_origin": "TOPLEFT" }, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 605.07567, "r_x1": 480.59180000000003, "r_y1": 605.07567, "r_x2": 480.59180000000003, "r_y2": 596.2787, "r_x3": 134.76498, "r_y3": 596.2787, "coord_origin": "TOPLEFT" }, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 617.03166, "r_x1": 480.5936899999999, "r_y1": 617.03166, "r_x2": 480.5936899999999, "r_y2": 608.2347, "r_x3": 134.76498, "r_y3": 608.2347, "coord_origin": "TOPLEFT" }, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 628.98666, "r_x1": 480.59072999999995, "r_y1": 628.98666, "r_x2": 480.59072999999995, "r_y2": 620.1897, "r_x3": 134.76498, "r_y3": 620.1897, "coord_origin": "TOPLEFT" }, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 640.9416699999999, "r_x1": 311.19769, "r_y1": 640.9416699999999, "r_x2": 311.19769, "r_y2": 632.1447000000001, "r_x3": 134.76498, "r_y3": 632.1447000000001, "coord_origin": "TOPLEFT" }, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.76498, "t": 644.1026899999999, "r": 480.59265, "b": 664.8546699999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9590610861778259, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 652.89966, "r_x1": 480.59186, "r_y1": 652.89966, "r_x2": 480.59186, "r_y2": 644.1026899999999, "r_x3": 149.70898, "r_y3": 644.1026899999999, "coord_origin": "TOPLEFT" }, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 664.8546699999999, "r_x1": 480.59265, "r_y1": 664.8546699999999, "r_x2": 480.59265, "r_y2": 656.05769, "r_x3": 134.76498, "r_y3": 656.05769, "coord_origin": "TOPLEFT" }, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 7, "page_no": 6, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.932651162147522, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 11, "page_no": 6, "cluster": { "id": 11, "label": "page_header", "bbox": { "l": 475.98431, "t": 93.77099999999996, "r": 480.59125000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8749732375144958, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7" }, { "label": "caption", "id": 6, "page_no": 6, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 134.765, "t": 125.79918999999984, "r": 480.5874, "b": 155.84966999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9333080053329468, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 133.72551999999996, "r_x1": 162.64424, "r_y1": 133.72551999999996, "r_x2": 162.64424, "r_y2": 125.79918999999984, "r_x3": 134.765, "r_y3": 125.79918999999984, "coord_origin": "TOPLEFT" }, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.276, "r_y0": 133.93169999999998, "r_x1": 480.58675999999997, "r_y1": 133.93169999999998, "r_x2": 480.58675999999997, "r_y2": 125.86200000000008, "r_x3": 166.276, "r_y3": 125.86200000000008, "coord_origin": "TOPLEFT" }, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 144.89068999999995, "r_x1": 480.5874, "r_y1": 144.89068999999995, "r_x2": 480.5874, "r_y2": 136.82097999999996, "r_x3": 134.765, "r_y3": 136.82097999999996, "coord_origin": "TOPLEFT" }, "text": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "orig": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 155.84966999999995, "r_x1": 306.1156, "r_y1": 155.84966999999995, "r_x2": 306.1156, "r_y2": 147.77997000000005, "r_x3": 134.765, "r_y3": 147.77997000000005, "coord_origin": "TOPLEFT" }, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 3. OTSL description of table structure: A - table example; B - graphical representation of table structure; C - mapping structure on a grid; D - OTSL structure encoding; E - explanation on cell encoding" }, { "label": "picture", "id": 12, "page_no": 6, "cluster": { "id": 12, "label": "picture", "bbox": { "l": 164.65028381347656, "t": 163.79708862304688, "r": 449.5505676269531, "b": 280.3409423828125, "coord_origin": "TOPLEFT" }, "confidence": 0.7868534922599792, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49326, "r_y0": 177.91540999999995, "r_x1": 381.66843, "r_y1": 177.91540999999995, "r_x2": 381.66843, "r_y2": 168.59362999999996, "r_x3": 374.49326, "r_y3": 168.59362999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74011, "r_y0": 177.82183999999995, "r_x1": 405.91528, "r_y1": 177.82183999999995, "r_x2": 405.91528, "r_y2": 168.50005999999996, "r_x3": 398.74011, "r_y3": 168.50005999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.76862, "r_y0": 202.24730999999997, "r_x1": 380.94379, "r_y1": 202.24730999999997, "r_x2": 380.94379, "r_y2": 192.92553999999996, "r_x3": 373.76862, "r_y3": 192.92553999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66388, "r_y0": 202.39239999999995, "r_x1": 393.83905, "r_y1": 202.39239999999995, "r_x2": 393.83905, "r_y2": 193.07061999999996, "r_x3": 386.66388, "r_y3": 193.07061999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.68707, "r_y0": 214.45934999999997, "r_x1": 393.86224, "r_y1": 214.45934999999997, "r_x2": 393.86224, "r_y2": 205.13756999999998, "r_x3": 386.68707, "r_y3": 205.13756999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.65729, "r_y0": 190.05457, "r_x1": 405.83246, "r_y1": 190.05457, "r_x2": 405.83246, "r_y2": 180.73279000000002, "r_x3": 398.65729, "r_y3": 180.73279000000002, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.77908, "r_y0": 190.06035999999995, "r_x1": 417.95425, "r_y1": 190.06035999999995, "r_x2": 417.95425, "r_y2": 180.73859000000004, "r_x3": 410.77908, "r_y3": 180.73859000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.90503, "r_y0": 189.97424, "r_x1": 430.08020000000005, "r_y1": 189.97424, "r_x2": 430.08020000000005, "r_y2": 180.65247, "r_x3": 422.90503, "r_y3": 180.65247, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7807, "r_y0": 202.31042000000002, "r_x1": 405.95587, "r_y1": 202.31042000000002, "r_x2": 405.95587, "r_y2": 192.98865, "r_x3": 398.7807, "r_y3": 192.98865, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90164, "r_y0": 202.31664999999998, "r_x1": 418.07681, "r_y1": 202.31664999999998, "r_x2": 418.07681, "r_y2": 192.99487, "r_x3": 410.90164, "r_y3": 192.99487, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.02753, "r_y0": 202.23077, "r_x1": 430.2027, "r_y1": 202.23077, "r_x2": 430.2027, "r_y2": 192.909, "r_x3": 423.02753, "r_y3": 192.909, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78235, "r_y0": 214.63751000000002, "r_x1": 405.95752, "r_y1": 214.63751000000002, "r_x2": 405.95752, "r_y2": 205.31573000000003, "r_x3": 398.78235, "r_y3": 205.31573000000003, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90414, "r_y0": 214.64373999999998, "r_x1": 418.07932, "r_y1": 214.64373999999998, "r_x2": 418.07932, "r_y2": 205.32196, "r_x3": 410.90414, "r_y3": 205.32196, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03003, "r_y0": 214.55791999999997, "r_x1": 430.20520000000005, "r_y1": 214.55791999999997, "r_x2": 430.20520000000005, "r_y2": 205.23614999999995, "r_x3": 423.03003, "r_y3": 205.23614999999995, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.50574, "r_y0": 226.36059999999998, "r_x1": 393.68091, "r_y1": 226.36059999999998, "r_x2": 393.68091, "r_y2": 217.03882, "r_x3": 386.50574, "r_y3": 217.03882, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.60181, "r_y0": 226.53882, "r_x1": 405.77698, "r_y1": 226.53882, "r_x2": 405.77698, "r_y2": 217.21704, "r_x3": 398.60181, "r_y3": 217.21704, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72275, "r_y0": 226.54498, "r_x1": 417.89792, "r_y1": 226.54498, "r_x2": 417.89792, "r_y2": 217.22321, "r_x3": 410.72275, "r_y3": 217.22321, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.84869, "r_y0": 226.45916999999997, "r_x1": 430.02386, "r_y1": 226.45916999999997, "r_x2": 430.02386, "r_y2": 217.13738999999998, "r_x3": 422.84869, "r_y3": 217.13738999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16009999999994, "r_y0": 177.01189999999997, "r_x1": 447.86273, "r_y1": 177.01189999999997, "r_x2": 447.86273, "r_y2": 167.69011999999998, "r_x3": 435.16009999999994, "r_y3": 167.69011999999998, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44415, "r_y0": 189.52202999999997, "r_x1": 448.14679, "r_y1": 189.52202999999997, "r_x2": 448.14679, "r_y2": 180.20025999999996, "r_x3": 435.44415, "r_y3": 180.20025999999996, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.46735, "r_y0": 201.81652999999994, "r_x1": 448.16998000000007, "r_y1": 201.81652999999994, "r_x2": 448.16998000000007, "r_y2": 192.49474999999995, "r_x3": 435.46735, "r_y3": 192.49474999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38202, "r_y0": 214.15204000000006, "r_x1": 448.08466, "r_y1": 214.15204000000006, "r_x2": 448.08466, "r_y2": 204.83025999999995, "r_x3": 435.38202, "r_y3": 204.83025999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.59906, "r_y0": 226.55548, "r_x1": 448.3017, "r_y1": 226.55548, "r_x2": 448.3017, "r_y2": 217.2337, "r_x3": 435.59906, "r_y3": 217.2337, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.14957, "r_y0": 214.55669999999998, "r_x1": 381.32474, "r_y1": 214.55669999999998, "r_x2": 381.32474, "r_y2": 205.23492, "r_x3": 374.14957, "r_y3": 205.23492, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0419, "r_y0": 226.46826, "r_x1": 381.21707, "r_y1": 226.46826, "r_x2": 381.21707, "r_y2": 217.14648, "r_x3": 374.0419, "r_y3": 217.14648, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34418, "r_y0": 190.25665000000004, "r_x1": 381.51935, "r_y1": 190.25665000000004, "r_x2": 381.51935, "r_y2": 180.93488000000002, "r_x3": 374.34418, "r_y3": 180.93488000000002, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76285, "r_y0": 177.89966000000004, "r_x1": 393.28833, "r_y1": 177.89966000000004, "r_x2": 393.28833, "r_y2": 168.57788000000005, "r_x3": 387.76285, "r_y3": 168.57788000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86395, "r_y0": 177.38373, "r_x1": 417.38943, "r_y1": 177.38373, "r_x2": 417.38943, "r_y2": 168.06195000000002, "r_x3": 411.86395, "r_y3": 168.06195000000002, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.33563, "r_y0": 177.25616000000002, "r_x1": 428.86111, "r_y1": 177.25616000000002, "r_x2": 428.86111, "r_y2": 167.93439, "r_x3": 423.33563, "r_y3": 167.93439, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.13593, "r_y0": 190.10753999999997, "r_x1": 393.76453, "r_y1": 190.10753999999997, "r_x2": 393.76453, "r_y2": 180.78576999999996, "r_x3": 387.13593, "r_y3": 180.78576999999996, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.2594, "r_y0": 253.83056999999997, "r_x1": 289.43457, "r_y1": 253.83056999999997, "r_x2": 289.43457, "r_y2": 244.50878999999998, "r_x3": 282.2594, "r_y3": 244.50878999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11035, "r_y0": 266.172, "r_x1": 289.28552, "r_y1": 266.172, "r_x2": 289.28552, "r_y2": 256.85022000000004, "r_x3": 282.11035, "r_y3": 256.85022000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.40848, "r_y0": 278.45477000000005, "r_x1": 289.58365, "r_y1": 278.45477000000005, "r_x2": 289.58365, "r_y2": 269.13300000000004, "r_x3": 282.40848, "r_y3": 269.13300000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.52902, "r_y0": 253.81525, "r_x1": 301.0545, "r_y1": 253.81525, "r_x2": 301.0545, "r_y2": 244.49347, "r_x3": 295.52902, "r_y3": 244.49347, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.46613, "r_y0": 253.89550999999994, "r_x1": 312.99161, "r_y1": 253.89550999999994, "r_x2": 312.99161, "r_y2": 244.57372999999995, "r_x3": 307.46613, "r_y3": 244.57372999999995, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.76886, "r_y0": 253.76215000000002, "r_x1": 324.29434, "r_y1": 253.76215000000002, "r_x2": 324.29434, "r_y2": 244.44037000000003, "r_x3": 318.76886, "r_y3": 244.44037000000003, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9021, "r_y0": 266.02332, "r_x1": 301.03976, "r_y1": 266.02332, "r_x2": 301.03976, "r_y2": 256.70154, "r_x3": 294.9021, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.17743, "r_y0": 266.02332, "r_x1": 325.59039, "r_y1": 266.02332, "r_x2": 325.59039, "r_y2": 256.70154, "r_x3": 307.17743, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.78949, "r_y0": 278.57599000000005, "r_x1": 300.92715, "r_y1": 278.57599000000005, "r_x2": 300.92715, "r_y2": 269.25420999999994, "r_x3": 294.78949, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06482, "r_y0": 278.57599000000005, "r_x1": 325.47778, "r_y1": 278.57599000000005, "r_x2": 325.47778, "r_y2": 269.25420999999994, "r_x3": 307.06482, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.93939, "r_y0": 278.06976, "r_x1": 203.11456, "r_y1": 278.06976, "r_x2": 203.11456, "r_y2": 268.74798999999996, "r_x3": 195.93939, "r_y3": 268.74798999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.20891, "r_y0": 278.05444, "r_x1": 214.73439, "r_y1": 278.05444, "r_x2": 214.73439, "r_y2": 268.73267, "r_x3": 209.20891, "r_y3": 268.73267, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.14551, "r_y0": 278.13469999999995, "r_x1": 226.67099, "r_y1": 278.13469999999995, "r_x2": 226.67099, "r_y2": 268.81293000000005, "r_x3": 221.14551, "r_y3": 268.81293000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.44858, "r_y0": 278.00134, "r_x1": 237.97405999999998, "r_y1": 278.00134, "r_x2": 237.97405999999998, "r_y2": 268.67957, "r_x3": 232.44858, "r_y3": 268.67957, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.21715, "r_y0": 253.86139000000003, "r_x1": 203.39232, "r_y1": 253.86139000000003, "r_x2": 203.39232, "r_y2": 244.53961000000004, "r_x3": 196.21715, "r_y3": 244.53961000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32143, "r_y0": 253.41992000000005, "r_x1": 257.49661, "r_y1": 253.41992000000005, "r_x2": 257.49661, "r_y2": 244.09813999999994, "r_x3": 250.32143, "r_y3": 244.09813999999994, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17235999999997, "r_y0": 265.76129000000003, "r_x1": 257.34753, "r_y1": 265.76129000000003, "r_x2": 257.34753, "r_y2": 256.43951000000004, "r_x3": 250.17235999999997, "r_y3": 256.43951000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47049000000004, "r_y0": 278.04400999999996, "r_x1": 257.64566, "r_y1": 278.04400999999996, "r_x2": 257.64566, "r_y2": 268.72222999999997, "r_x3": 250.47049000000004, "r_y3": 268.72222999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 249.20911, "r_x1": 337.22485, "r_y1": 249.20911, "r_x2": 337.22485, "r_y2": 242.99463000000003, "r_x3": 334.51135, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.93835, "r_y0": 249.20911, "r_x1": 391.49472, "r_y1": 249.20911, "r_x2": 391.49472, "r_y2": 242.99463000000003, "r_x3": 339.93835, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 259.14703, "r_x1": 337.33313, "r_y1": 259.14703, "r_x2": 337.33313, "r_y2": 252.93255999999997, "r_x3": 334.51135, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15491, "r_y0": 259.14703, "r_x1": 421.98624, "r_y1": 259.14703, "r_x2": 421.98624, "r_y2": 252.93255999999997, "r_x3": 340.15491, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 269.08496, "r_x1": 337.29868, "r_y1": 269.08496, "r_x2": 337.29868, "r_y2": 262.87048000000004, "r_x3": 334.51135, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.086, "r_y0": 269.08496, "r_x1": 415.34375, "r_y1": 269.08496, "r_x2": 415.34375, "r_y2": 262.87048000000004, "r_x3": 340.086, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 279.02288999999996, "r_x1": 337.30188, "r_y1": 279.02288999999996, "r_x2": 337.30188, "r_y2": 272.80841, "r_x3": 334.51135, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09241, "r_y0": 279.02288999999996, "r_x1": 426.59875, "r_y1": 279.02288999999996, "r_x2": 426.59875, "r_y2": 272.80841, "r_x3": 340.09241, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67178, "r_y0": 250.25671, "r_x1": 189.35544, "r_y1": 250.25671, "r_x2": 189.35544, "r_y2": 244.04224, "r_x3": 185.67178, "r_y3": 244.04224, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.96759, "r_y0": 274.56213, "r_x1": 189.65125, "r_y1": 274.56213, "r_x2": 189.65125, "r_y2": 268.34766, "r_x3": 185.96759, "r_y3": 268.34766, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34152, "r_y0": 249.83972000000006, "r_x1": 243.02518, "r_y1": 249.83972000000006, "r_x2": 243.02518, "r_y2": 243.62523999999996, "r_x3": 239.34152, "r_y3": 243.62523999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.32852, "r_y0": 249.70836999999995, "r_x1": 275.01218, "r_y1": 249.70836999999995, "r_x2": 275.01218, "r_y2": 243.49390000000005, "r_x3": 271.32852, "r_y3": 243.49390000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.81627, "r_y0": 172.72942999999998, "r_x1": 233.49992000000003, "r_y1": 172.72942999999998, "r_x2": 233.49992000000003, "r_y2": 166.51495, "r_x3": 229.81627, "r_y3": 166.51495, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24402, "r_y0": 196.17548, "r_x1": 260.92767, "r_y1": 196.17548, "r_x2": 260.92767, "r_y2": 189.961, "r_x3": 257.24402, "r_y3": 189.961, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.87526, "r_y0": 184.19115999999997, "r_x1": 190.55891, "r_y1": 184.19115999999997, "r_x2": 190.55891, "r_y2": 177.97668, "r_x3": 186.87526, "r_y3": 177.97668, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.48746, "r_y0": 175.22968000000003, "r_x1": 200.17111, "r_y1": 175.22968000000003, "r_x2": 200.17111, "r_y2": 169.01520000000005, "r_x3": 196.48746, "r_y3": 169.01520000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 175.65039000000002, "r_x1": 175.72659, "r_y1": 175.65039000000002, "r_x2": 175.72659, "r_y2": 167.88225999999997, "r_x3": 169.74728, "r_y3": 167.88225999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 214.60681, "r_x1": 175.72659, "r_y1": 214.60681, "r_x2": 175.72659, "r_y2": 206.83867999999995, "r_x3": 169.74728, "r_y3": 206.83867999999995, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29419, "r_y0": 176.04785000000004, "r_x1": 280.2735, "r_y1": 176.04785000000004, "r_x2": 280.2735, "r_y2": 168.27972, "r_x3": 274.29419, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56152, "r_y0": 176.04785000000004, "r_x1": 365.54083, "r_y1": 176.04785000000004, "r_x2": 365.54083, "r_y2": 168.27972, "r_x3": 359.56152, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 250.97960999999998, "r_x1": 175.27112, "r_y1": 250.97960999999998, "r_x2": 175.27112, "r_y2": 243.21149000000003, "r_x3": 169.74728, "r_y3": 243.21149000000003, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 38, "label": "text", "bbox": { "l": 374.49326, "t": 168.59362999999996, "r": 381.66843, "b": 177.91540999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49326, "r_y0": 177.91540999999995, "r_x1": 381.66843, "r_y1": 177.91540999999995, "r_x2": 381.66843, "r_y2": 168.59362999999996, "r_x3": 374.49326, "r_y3": 168.59362999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 398.74011, "t": 168.50005999999996, "r": 405.91528, "b": 177.82183999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74011, "r_y0": 177.82183999999995, "r_x1": 405.91528, "r_y1": 177.82183999999995, "r_x2": 405.91528, "r_y2": 168.50005999999996, "r_x3": 398.74011, "r_y3": 168.50005999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 373.76862, "t": 192.92553999999996, "r": 380.94379, "b": 202.24730999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.76862, "r_y0": 202.24730999999997, "r_x1": 380.94379, "r_y1": 202.24730999999997, "r_x2": 380.94379, "r_y2": 192.92553999999996, "r_x3": 373.76862, "r_y3": 192.92553999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 386.66388, "t": 193.07061999999996, "r": 393.83905, "b": 202.39239999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66388, "r_y0": 202.39239999999995, "r_x1": 393.83905, "r_y1": 202.39239999999995, "r_x2": 393.83905, "r_y2": 193.07061999999996, "r_x3": 386.66388, "r_y3": 193.07061999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 386.68707, "t": 205.13756999999998, "r": 393.86224, "b": 214.45934999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.68707, "r_y0": 214.45934999999997, "r_x1": 393.86224, "r_y1": 214.45934999999997, "r_x2": 393.86224, "r_y2": 205.13756999999998, "r_x3": 386.68707, "r_y3": 205.13756999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 398.65729, "t": 180.73279000000002, "r": 405.83246, "b": 190.05457, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.65729, "r_y0": 190.05457, "r_x1": 405.83246, "r_y1": 190.05457, "r_x2": 405.83246, "r_y2": 180.73279000000002, "r_x3": 398.65729, "r_y3": 180.73279000000002, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 410.77908, "t": 180.73859000000004, "r": 417.95425, "b": 190.06035999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.77908, "r_y0": 190.06035999999995, "r_x1": 417.95425, "r_y1": 190.06035999999995, "r_x2": 417.95425, "r_y2": 180.73859000000004, "r_x3": 410.77908, "r_y3": 180.73859000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 422.90503, "t": 180.65247, "r": 430.08020000000005, "b": 189.97424, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.90503, "r_y0": 189.97424, "r_x1": 430.08020000000005, "r_y1": 189.97424, "r_x2": 430.08020000000005, "r_y2": 180.65247, "r_x3": 422.90503, "r_y3": 180.65247, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 398.7807, "t": 192.98865, "r": 405.95587, "b": 202.31042000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7807, "r_y0": 202.31042000000002, "r_x1": 405.95587, "r_y1": 202.31042000000002, "r_x2": 405.95587, "r_y2": 192.98865, "r_x3": 398.7807, "r_y3": 192.98865, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 410.90164, "t": 192.99487, "r": 418.07681, "b": 202.31664999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90164, "r_y0": 202.31664999999998, "r_x1": 418.07681, "r_y1": 202.31664999999998, "r_x2": 418.07681, "r_y2": 192.99487, "r_x3": 410.90164, "r_y3": 192.99487, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 423.02753, "t": 192.909, "r": 430.2027, "b": 202.23077, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.02753, "r_y0": 202.23077, "r_x1": 430.2027, "r_y1": 202.23077, "r_x2": 430.2027, "r_y2": 192.909, "r_x3": 423.02753, "r_y3": 192.909, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 398.78235, "t": 205.31573000000003, "r": 405.95752, "b": 214.63751000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78235, "r_y0": 214.63751000000002, "r_x1": 405.95752, "r_y1": 214.63751000000002, "r_x2": 405.95752, "r_y2": 205.31573000000003, "r_x3": 398.78235, "r_y3": 205.31573000000003, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 410.90414, "t": 205.32196, "r": 418.07932, "b": 214.64373999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90414, "r_y0": 214.64373999999998, "r_x1": 418.07932, "r_y1": 214.64373999999998, "r_x2": 418.07932, "r_y2": 205.32196, "r_x3": 410.90414, "r_y3": 205.32196, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 423.03003, "t": 205.23614999999995, "r": 430.20520000000005, "b": 214.55791999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03003, "r_y0": 214.55791999999997, "r_x1": 430.20520000000005, "r_y1": 214.55791999999997, "r_x2": 430.20520000000005, "r_y2": 205.23614999999995, "r_x3": 423.03003, "r_y3": 205.23614999999995, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 386.50574, "t": 217.03882, "r": 393.68091, "b": 226.36059999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.50574, "r_y0": 226.36059999999998, "r_x1": 393.68091, "r_y1": 226.36059999999998, "r_x2": 393.68091, "r_y2": 217.03882, "r_x3": 386.50574, "r_y3": 217.03882, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 398.60181, "t": 217.21704, "r": 405.77698, "b": 226.53882, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.60181, "r_y0": 226.53882, "r_x1": 405.77698, "r_y1": 226.53882, "r_x2": 405.77698, "r_y2": 217.21704, "r_x3": 398.60181, "r_y3": 217.21704, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 410.72275, "t": 217.22321, "r": 417.89792, "b": 226.54498, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72275, "r_y0": 226.54498, "r_x1": 417.89792, "r_y1": 226.54498, "r_x2": 417.89792, "r_y2": 217.22321, "r_x3": 410.72275, "r_y3": 217.22321, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 422.84869, "t": 217.13738999999998, "r": 430.02386, "b": 226.45916999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.84869, "r_y0": 226.45916999999997, "r_x1": 430.02386, "r_y1": 226.45916999999997, "r_x2": 430.02386, "r_y2": 217.13738999999998, "r_x3": 422.84869, "r_y3": 217.13738999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 435.16009999999994, "t": 167.69011999999998, "r": 447.86273, "b": 177.01189999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16009999999994, "r_y0": 177.01189999999997, "r_x1": 447.86273, "r_y1": 177.01189999999997, "r_x2": 447.86273, "r_y2": 167.69011999999998, "r_x3": 435.16009999999994, "r_y3": 167.69011999999998, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 435.44415, "t": 180.20025999999996, "r": 448.14679, "b": 189.52202999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44415, "r_y0": 189.52202999999997, "r_x1": 448.14679, "r_y1": 189.52202999999997, "r_x2": 448.14679, "r_y2": 180.20025999999996, "r_x3": 435.44415, "r_y3": 180.20025999999996, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 435.46735, "t": 192.49474999999995, "r": 448.16998000000007, "b": 201.81652999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.46735, "r_y0": 201.81652999999994, "r_x1": 448.16998000000007, "r_y1": 201.81652999999994, "r_x2": 448.16998000000007, "r_y2": 192.49474999999995, "r_x3": 435.46735, "r_y3": 192.49474999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 435.38202, "t": 204.83025999999995, "r": 448.08466, "b": 214.15204000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38202, "r_y0": 214.15204000000006, "r_x1": 448.08466, "r_y1": 214.15204000000006, "r_x2": 448.08466, "r_y2": 204.83025999999995, "r_x3": 435.38202, "r_y3": 204.83025999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 435.59906, "t": 217.2337, "r": 448.3017, "b": 226.55548, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.59906, "r_y0": 226.55548, "r_x1": 448.3017, "r_y1": 226.55548, "r_x2": 448.3017, "r_y2": 217.2337, "r_x3": 435.59906, "r_y3": 217.2337, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 374.14957, "t": 205.23492, "r": 381.32474, "b": 214.55669999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.14957, "r_y0": 214.55669999999998, "r_x1": 381.32474, "r_y1": 214.55669999999998, "r_x2": 381.32474, "r_y2": 205.23492, "r_x3": 374.14957, "r_y3": 205.23492, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 374.0419, "t": 217.14648, "r": 381.21707, "b": 226.46826, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0419, "r_y0": 226.46826, "r_x1": 381.21707, "r_y1": 226.46826, "r_x2": 381.21707, "r_y2": 217.14648, "r_x3": 374.0419, "r_y3": 217.14648, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 374.34418, "t": 180.93488000000002, "r": 381.51935, "b": 190.25665000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34418, "r_y0": 190.25665000000004, "r_x1": 381.51935, "r_y1": 190.25665000000004, "r_x2": 381.51935, "r_y2": 180.93488000000002, "r_x3": 374.34418, "r_y3": 180.93488000000002, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 387.76285, "t": 168.57788000000005, "r": 393.28833, "b": 177.89966000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76285, "r_y0": 177.89966000000004, "r_x1": 393.28833, "r_y1": 177.89966000000004, "r_x2": 393.28833, "r_y2": 168.57788000000005, "r_x3": 387.76285, "r_y3": 168.57788000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 411.86395, "t": 168.06195000000002, "r": 417.38943, "b": 177.38373, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86395, "r_y0": 177.38373, "r_x1": 417.38943, "r_y1": 177.38373, "r_x2": 417.38943, "r_y2": 168.06195000000002, "r_x3": 411.86395, "r_y3": 168.06195000000002, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 423.33563, "t": 167.93439, "r": 428.86111, "b": 177.25616000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.33563, "r_y0": 177.25616000000002, "r_x1": 428.86111, "r_y1": 177.25616000000002, "r_x2": 428.86111, "r_y2": 167.93439, "r_x3": 423.33563, "r_y3": 167.93439, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 387.13593, "t": 180.78576999999996, "r": 393.76453, "b": 190.10753999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.13593, "r_y0": 190.10753999999997, "r_x1": 393.76453, "r_y1": 190.10753999999997, "r_x2": 393.76453, "r_y2": 180.78576999999996, "r_x3": 387.13593, "r_y3": 180.78576999999996, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 282.2594, "t": 244.50878999999998, "r": 289.43457, "b": 253.83056999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.2594, "r_y0": 253.83056999999997, "r_x1": 289.43457, "r_y1": 253.83056999999997, "r_x2": 289.43457, "r_y2": 244.50878999999998, "r_x3": 282.2594, "r_y3": 244.50878999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 282.11035, "t": 256.85022000000004, "r": 289.28552, "b": 266.172, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11035, "r_y0": 266.172, "r_x1": 289.28552, "r_y1": 266.172, "r_x2": 289.28552, "r_y2": 256.85022000000004, "r_x3": 282.11035, "r_y3": 256.85022000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 282.40848, "t": 269.13300000000004, "r": 289.58365, "b": 278.45477000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.40848, "r_y0": 278.45477000000005, "r_x1": 289.58365, "r_y1": 278.45477000000005, "r_x2": 289.58365, "r_y2": 269.13300000000004, "r_x3": 282.40848, "r_y3": 269.13300000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 295.52902, "t": 244.49347, "r": 301.0545, "b": 253.81525, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.52902, "r_y0": 253.81525, "r_x1": 301.0545, "r_y1": 253.81525, "r_x2": 301.0545, "r_y2": 244.49347, "r_x3": 295.52902, "r_y3": 244.49347, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 307.46613, "t": 244.57372999999995, "r": 312.99161, "b": 253.89550999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.46613, "r_y0": 253.89550999999994, "r_x1": 312.99161, "r_y1": 253.89550999999994, "r_x2": 312.99161, "r_y2": 244.57372999999995, "r_x3": 307.46613, "r_y3": 244.57372999999995, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 318.76886, "t": 244.44037000000003, "r": 324.29434, "b": 253.76215000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.76886, "r_y0": 253.76215000000002, "r_x1": 324.29434, "r_y1": 253.76215000000002, "r_x2": 324.29434, "r_y2": 244.44037000000003, "r_x3": 318.76886, "r_y3": 244.44037000000003, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 294.9021, "t": 256.70154, "r": 301.03976, "b": 266.02332, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9021, "r_y0": 266.02332, "r_x1": 301.03976, "r_y1": 266.02332, "r_x2": 301.03976, "r_y2": 256.70154, "r_x3": 294.9021, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 307.17743, "t": 256.70154, "r": 325.59039, "b": 266.02332, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.17743, "r_y0": 266.02332, "r_x1": 325.59039, "r_y1": 266.02332, "r_x2": 325.59039, "r_y2": 256.70154, "r_x3": 307.17743, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 294.78949, "t": 269.25420999999994, "r": 300.92715, "b": 278.57599000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.78949, "r_y0": 278.57599000000005, "r_x1": 300.92715, "r_y1": 278.57599000000005, "r_x2": 300.92715, "r_y2": 269.25420999999994, "r_x3": 294.78949, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 307.06482, "t": 269.25420999999994, "r": 325.47778, "b": 278.57599000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06482, "r_y0": 278.57599000000005, "r_x1": 325.47778, "r_y1": 278.57599000000005, "r_x2": 325.47778, "r_y2": 269.25420999999994, "r_x3": 307.06482, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 195.93939, "t": 268.74798999999996, "r": 203.11456, "b": 278.06976, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.93939, "r_y0": 278.06976, "r_x1": 203.11456, "r_y1": 278.06976, "r_x2": 203.11456, "r_y2": 268.74798999999996, "r_x3": 195.93939, "r_y3": 268.74798999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 209.20891, "t": 268.73267, "r": 214.73439, "b": 278.05444, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.20891, "r_y0": 278.05444, "r_x1": 214.73439, "r_y1": 278.05444, "r_x2": 214.73439, "r_y2": 268.73267, "r_x3": 209.20891, "r_y3": 268.73267, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 221.14551, "t": 268.81293000000005, "r": 226.67099, "b": 278.13469999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.14551, "r_y0": 278.13469999999995, "r_x1": 226.67099, "r_y1": 278.13469999999995, "r_x2": 226.67099, "r_y2": 268.81293000000005, "r_x3": 221.14551, "r_y3": 268.81293000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.44858, "t": 268.67957, "r": 237.97405999999998, "b": 278.00134, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.44858, "r_y0": 278.00134, "r_x1": 237.97405999999998, "r_y1": 278.00134, "r_x2": 237.97405999999998, "r_y2": 268.67957, "r_x3": 232.44858, "r_y3": 268.67957, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 196.21715, "t": 244.53961000000004, "r": 203.39232, "b": 253.86139000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.21715, "r_y0": 253.86139000000003, "r_x1": 203.39232, "r_y1": 253.86139000000003, "r_x2": 203.39232, "r_y2": 244.53961000000004, "r_x3": 196.21715, "r_y3": 244.53961000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 250.32143, "t": 244.09813999999994, "r": 257.49661, "b": 253.41992000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32143, "r_y0": 253.41992000000005, "r_x1": 257.49661, "r_y1": 253.41992000000005, "r_x2": 257.49661, "r_y2": 244.09813999999994, "r_x3": 250.32143, "r_y3": 244.09813999999994, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 250.17235999999997, "t": 256.43951000000004, "r": 257.34753, "b": 265.76129000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17235999999997, "r_y0": 265.76129000000003, "r_x1": 257.34753, "r_y1": 265.76129000000003, "r_x2": 257.34753, "r_y2": 256.43951000000004, "r_x3": 250.17235999999997, "r_y3": 256.43951000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 250.47049000000004, "t": 268.72222999999997, "r": 257.64566, "b": 278.04400999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47049000000004, "r_y0": 278.04400999999996, "r_x1": 257.64566, "r_y1": 278.04400999999996, "r_x2": 257.64566, "r_y2": 268.72222999999997, "r_x3": 250.47049000000004, "r_y3": 268.72222999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 334.51135, "t": 242.99463000000003, "r": 337.22485, "b": 249.20911, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 249.20911, "r_x1": 337.22485, "r_y1": 249.20911, "r_x2": 337.22485, "r_y2": 242.99463000000003, "r_x3": 334.51135, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 339.93835, "t": 242.99463000000003, "r": 391.49472, "b": 249.20911, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.93835, "r_y0": 249.20911, "r_x1": 391.49472, "r_y1": 249.20911, "r_x2": 391.49472, "r_y2": 242.99463000000003, "r_x3": 339.93835, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 334.51135, "t": 252.93255999999997, "r": 337.33313, "b": 259.14703, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 259.14703, "r_x1": 337.33313, "r_y1": 259.14703, "r_x2": 337.33313, "r_y2": 252.93255999999997, "r_x3": 334.51135, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 340.15491, "t": 252.93255999999997, "r": 421.98624, "b": 259.14703, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15491, "r_y0": 259.14703, "r_x1": 421.98624, "r_y1": 259.14703, "r_x2": 421.98624, "r_y2": 252.93255999999997, "r_x3": 340.15491, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 334.51135, "t": 262.87048000000004, "r": 337.29868, "b": 269.08496, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 269.08496, "r_x1": 337.29868, "r_y1": 269.08496, "r_x2": 337.29868, "r_y2": 262.87048000000004, "r_x3": 334.51135, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 340.086, "t": 262.87048000000004, "r": 415.34375, "b": 269.08496, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.086, "r_y0": 269.08496, "r_x1": 415.34375, "r_y1": 269.08496, "r_x2": 415.34375, "r_y2": 262.87048000000004, "r_x3": 340.086, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 334.51135, "t": 272.80841, "r": 426.59875, "b": 279.02288999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.5250625610351562, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 279.02288999999996, "r_x1": 337.30188, "r_y1": 279.02288999999996, "r_x2": 337.30188, "r_y2": 272.80841, "r_x3": 334.51135, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09241, "r_y0": 279.02288999999996, "r_x1": 426.59875, "r_y1": 279.02288999999996, "r_x2": 426.59875, "r_y2": 272.80841, "r_x3": 340.09241, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 185.67178, "t": 244.04224, "r": 189.35544, "b": 250.25671, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67178, "r_y0": 250.25671, "r_x1": 189.35544, "r_y1": 250.25671, "r_x2": 189.35544, "r_y2": 244.04224, "r_x3": 185.67178, "r_y3": 244.04224, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 185.96759, "t": 268.34766, "r": 189.65125, "b": 274.56213, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.96759, "r_y0": 274.56213, "r_x1": 189.65125, "r_y1": 274.56213, "r_x2": 189.65125, "r_y2": 268.34766, "r_x3": 185.96759, "r_y3": 268.34766, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 239.34152, "t": 243.62523999999996, "r": 243.02518, "b": 249.83972000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34152, "r_y0": 249.83972000000006, "r_x1": 243.02518, "r_y1": 249.83972000000006, "r_x2": 243.02518, "r_y2": 243.62523999999996, "r_x3": 239.34152, "r_y3": 243.62523999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 271.32852, "t": 243.49390000000005, "r": 275.01218, "b": 249.70836999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.32852, "r_y0": 249.70836999999995, "r_x1": 275.01218, "r_y1": 249.70836999999995, "r_x2": 275.01218, "r_y2": 243.49390000000005, "r_x3": 271.32852, "r_y3": 243.49390000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 229.81627, "t": 166.51495, "r": 233.49992000000003, "b": 172.72942999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.81627, "r_y0": 172.72942999999998, "r_x1": 233.49992000000003, "r_y1": 172.72942999999998, "r_x2": 233.49992000000003, "r_y2": 166.51495, "r_x3": 229.81627, "r_y3": 166.51495, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 257.24402, "t": 189.961, "r": 260.92767, "b": 196.17548, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24402, "r_y0": 196.17548, "r_x1": 260.92767, "r_y1": 196.17548, "r_x2": 260.92767, "r_y2": 189.961, "r_x3": 257.24402, "r_y3": 189.961, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 186.87526, "t": 177.97668, "r": 190.55891, "b": 184.19115999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.87526, "r_y0": 184.19115999999997, "r_x1": 190.55891, "r_y1": 184.19115999999997, "r_x2": 190.55891, "r_y2": 177.97668, "r_x3": 186.87526, "r_y3": 177.97668, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 196.48746, "t": 169.01520000000005, "r": 200.17111, "b": 175.22968000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.48746, "r_y0": 175.22968000000003, "r_x1": 200.17111, "r_y1": 175.22968000000003, "r_x2": 200.17111, "r_y2": 169.01520000000005, "r_x3": 196.48746, "r_y3": 169.01520000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 169.74728, "t": 167.88225999999997, "r": 175.72659, "b": 175.65039000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 175.65039000000002, "r_x1": 175.72659, "r_y1": 175.65039000000002, "r_x2": 175.72659, "r_y2": 167.88225999999997, "r_x3": 169.74728, "r_y3": 167.88225999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 169.74728, "t": 206.83867999999995, "r": 175.72659, "b": 214.60681, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 214.60681, "r_x1": 175.72659, "r_y1": 214.60681, "r_x2": 175.72659, "r_y2": 206.83867999999995, "r_x3": 169.74728, "r_y3": 206.83867999999995, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 274.29419, "t": 168.27972, "r": 280.2735, "b": 176.04785000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29419, "r_y0": 176.04785000000004, "r_x1": 280.2735, "r_y1": 176.04785000000004, "r_x2": 280.2735, "r_y2": 168.27972, "r_x3": 274.29419, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 359.56152, "t": 168.27972, "r": 365.54083, "b": 176.04785000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56152, "r_y0": 176.04785000000004, "r_x1": 365.54083, "r_y1": 176.04785000000004, "r_x2": 365.54083, "r_y2": 168.27972, "r_x3": 359.56152, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 169.74728, "t": 243.21149000000003, "r": 175.27112, "b": 250.97960999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 250.97960999999998, "r_x1": 175.27112, "r_y1": 250.97960999999998, "r_x2": 175.27112, "r_y2": 243.21149000000003, "r_x3": 169.74728, "r_y3": 243.21149000000003, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "section_header", "id": 9, "page_no": 6, "cluster": { "id": 9, "label": "section_header", "bbox": { "l": 134.765, "t": 305.29581, "r": 246.65197999999998, "b": 314.10275, "coord_origin": "TOPLEFT" }, "confidence": 0.9233023524284363, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 314.10275, "r_x1": 149.40205, "r_y1": 314.10275, "r_x2": 149.40205, "r_y2": 305.29581, "r_x3": 134.765, "r_y3": 305.29581, "coord_origin": "TOPLEFT" }, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 314.10275, "r_x1": 246.65197999999998, "r_y1": 314.10275, "r_x2": 246.65197999999998, "r_y2": 305.29581, "r_x3": 160.85904, "r_y3": 305.29581, "coord_origin": "TOPLEFT" }, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.2 Language Syntax" }, { "label": "text", "id": 10, "page_no": 6, "cluster": { "id": 10, "label": "text", "bbox": { "l": 134.765, "t": 325.24777, "r": 363.79617, "b": 334.04474, "coord_origin": "TOPLEFT" }, "confidence": 0.9169168472290039, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 334.04474, "r_x1": 363.79617, "r_y1": 334.04474, "r_x2": 363.79617, "r_y2": 325.24777, "r_x3": 134.765, "r_y3": 325.24777, "coord_origin": "TOPLEFT" }, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The OTSL representation follows these syntax rules:" }, { "label": "list_item", "id": 3, "page_no": 6, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 138.97299, "t": 347.17081, "r": 480.58902, "b": 367.93375, "coord_origin": "TOPLEFT" }, "confidence": 0.9588112235069275, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 355.97775, "r_x1": 146.71991, "r_y1": 355.97775, "r_x2": 146.71991, "r_y2": 347.18079, "r_x3": 138.97299, "r_y3": 347.18079, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 355.97775, "r_x1": 257.37927, "r_y1": 355.97775, "r_x2": 257.37927, "r_y2": 347.17081, "r_x3": 151.70099, "r_y3": 347.17081, "coord_origin": "TOPLEFT" }, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.383, "r_y0": 355.97775, "r_x1": 480.58902, "r_y1": 355.97775, "r_x2": 480.58902, "r_y2": 347.18079, "r_x3": 257.383, "r_y3": 347.18079, "coord_origin": "TOPLEFT" }, "text": ": The left neighbour of an \"L\" cell must be either", "orig": ": The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 367.93375, "r_x1": 283.59387, "r_y1": 367.93375, "r_x2": 283.59387, "r_y2": 359.13678, "r_x3": 151.70099, "r_y3": 359.13678, "coord_origin": "TOPLEFT" }, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Left-looking cell rule : The left neighbour of an \"L\" cell must be either another \"L\" cell or a \"C\" cell." }, { "label": "list_item", "id": 4, "page_no": 6, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 138.97299, "t": 371.08481, "r": 480.59229000000005, "b": 391.84673999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9585386514663696, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 379.89175, "r_x1": 146.71991, "r_y1": 379.89175, "r_x2": 146.71991, "r_y2": 371.09479, "r_x3": 138.97299, "r_y3": 371.09479, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 379.89175, "r_x1": 252.11203, "r_y1": 379.89175, "r_x2": 252.11203, "r_y2": 371.08481, "r_x3": 151.70099, "r_y3": 371.08481, "coord_origin": "TOPLEFT" }, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.112, "r_y0": 379.89175, "r_x1": 480.59229000000005, "r_y1": 379.89175, "r_x2": 480.59229000000005, "r_y2": 371.09479, "r_x3": 252.112, "r_y3": 371.09479, "coord_origin": "TOPLEFT" }, "text": ": The upper neighbour of a \"U\" cell must be either", "orig": ": The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 391.84673999999995, "r_x1": 284.8392, "r_y1": 391.84673999999995, "r_x2": 284.8392, "r_y2": 383.04977, "r_x3": 151.70099, "r_y3": 383.04977, "coord_origin": "TOPLEFT" }, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Up-looking cell rule : The upper neighbour of a \"U\" cell must be either another \"U\" cell or a \"C\" cell." }, { "label": "section_header", "id": 14, "page_no": 6, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 138.97299, "t": 394.99780000000004, "r": 226.07360999999997, "b": 403.80475, "coord_origin": "TOPLEFT" }, "confidence": 0.6506174206733704, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 403.80475, "r_x1": 146.71991, "r_y1": 403.80475, "r_x2": 146.71991, "r_y2": 395.0077800000001, "r_x3": 138.97299, "r_y3": 395.0077800000001, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 403.80475, "r_x1": 223.3042, "r_y1": 403.80475, "r_x2": 223.3042, "r_y2": 394.99780000000004, "r_x3": 151.70099, "r_y3": 394.99780000000004, "coord_origin": "TOPLEFT" }, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.30699, "r_y0": 403.80475, "r_x1": 226.07360999999997, "r_y1": 403.80475, "r_x2": 226.07360999999997, "r_y2": 395.0077800000001, "r_x3": 223.30699, "r_y3": 395.0077800000001, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Cross cell rule :" }, { "label": "list_item", "id": 13, "page_no": 6, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 151.70099, "t": 406.96677, "r": 480.59238, "b": 439.67371, "coord_origin": "TOPLEFT" }, "confidence": 0.7247239947319031, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 415.76373, "r_x1": 480.59238, "r_y1": 415.76373, "r_x2": 480.59238, "r_y2": 406.96677, "r_x3": 151.70099, "r_y3": 406.96677, "coord_origin": "TOPLEFT" }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 427.71871999999996, "r_x1": 480.59219, "r_y1": 427.71871999999996, "r_x2": 480.59219, "r_y2": 418.9217499999999, "r_x3": 151.70099, "r_y3": 418.9217499999999, "coord_origin": "TOPLEFT" }, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 439.67371, "r_x1": 214.39663999999996, "r_y1": 439.67371, "r_x2": 214.39663999999996, "r_y2": 430.87674, "r_x3": 151.70099, "r_y3": 430.87674, "coord_origin": "TOPLEFT" }, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\" cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell or an \"L\" cell." }, { "label": "list_item", "id": 8, "page_no": 6, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 138.97299, "t": 442.82574, "r": 474.59018, "b": 451.63269, "coord_origin": "TOPLEFT" }, "confidence": 0.9259927272796631, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 451.63269, "r_x1": 146.71991, "r_y1": 451.63269, "r_x2": 146.71991, "r_y2": 442.83572, "r_x3": 138.97299, "r_y3": 442.83572, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 451.63269, "r_x1": 221.32263, "r_y1": 451.63269, "r_x2": 221.32263, "r_y2": 442.82574, "r_x3": 151.70099, "r_y3": 442.82574, "coord_origin": "TOPLEFT" }, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.32700000000003, "r_y0": 451.63269, "r_x1": 474.59018, "r_y1": 451.63269, "r_x2": 474.59018, "r_y2": 442.83572, "r_x3": 221.32700000000003, "r_y3": 442.83572, "coord_origin": "TOPLEFT" }, "text": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. First row rule : Only \"L\" cells and \"C\" cells are allowed in the first row." }, { "label": "list_item", "id": 5, "page_no": 6, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 138.97299, "t": 454.78375, "r": 480.58746, "b": 475.54568, "coord_origin": "TOPLEFT" }, "confidence": 0.9420599937438965, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 463.5907, "r_x1": 146.71991, "r_y1": 463.5907, "r_x2": 146.71991, "r_y2": 454.7937299999999, "r_x3": 138.97299, "r_y3": 454.7937299999999, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 463.5907, "r_x1": 240.71982, "r_y1": 463.5907, "r_x2": 240.71982, "r_y2": 454.78375, "r_x3": 151.70099, "r_y3": 454.78375, "coord_origin": "TOPLEFT" }, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.71599, "r_y0": 463.5907, "r_x1": 480.58746, "r_y1": 463.5907, "r_x2": 480.58746, "r_y2": 454.7937299999999, "r_x3": 240.71599, "r_y3": 454.7937299999999, "coord_origin": "TOPLEFT" }, "text": ": Only \"U\" cells and \"C\" cells are allowed in the first", "orig": ": Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 475.54568, "r_x1": 186.0072, "r_y1": 475.54568, "r_x2": 186.0072, "r_y2": 466.74872, "r_x3": 151.70099, "r_y3": 466.74872, "coord_origin": "TOPLEFT" }, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. First column rule : Only \"U\" cells and \"C\" cells are allowed in the first column." }, { "label": "list_item", "id": 1, "page_no": 6, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 138.97299, "t": 478.69675, "r": 480.59457, "b": 499.45969, "coord_origin": "TOPLEFT" }, "confidence": 0.9617829918861389, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 487.50369, "r_x1": 146.71991, "r_y1": 487.50369, "r_x2": 146.71991, "r_y2": 478.70673, "r_x3": 138.97299, "r_y3": 478.70673, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 487.50369, "r_x1": 235.15768, "r_y1": 487.50369, "r_x2": 235.15768, "r_y2": 478.69675, "r_x3": 151.70099, "r_y3": 478.69675, "coord_origin": "TOPLEFT" }, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.15697999999998, "r_y0": 487.50369, "r_x1": 480.59457, "r_y1": 487.50369, "r_x2": 480.59457, "r_y2": 478.70673, "r_x3": 235.15697999999998, "r_y3": 478.70673, "coord_origin": "TOPLEFT" }, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 499.45969, "r_x1": 448.04147, "r_y1": 499.45969, "r_x2": 448.04147, "r_y2": 490.66272, "r_x3": 151.70099, "r_y3": 490.66272, "coord_origin": "TOPLEFT" }, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Rectangular rule : The table representation is always rectangular - all rows must have an equal number of tokens, terminated with \"NL\" token." }, { "label": "text", "id": 0, "page_no": 6, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76498, "t": 512.59271, "r": 480.59583, "b": 640.9416699999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9785562753677368, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 521.38968, "r_x1": 480.59583, "r_y1": 521.38968, "r_x2": 480.59583, "r_y2": 512.59271, "r_x3": 149.70898, "r_y3": 512.59271, "coord_origin": "TOPLEFT" }, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 533.34467, "r_x1": 480.59079, "r_y1": 533.34467, "r_x2": 480.59079, "r_y2": 524.5477000000001, "r_x3": 134.76498, "r_y3": 524.5477000000001, "coord_origin": "TOPLEFT" }, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 545.29967, "r_x1": 480.59482, "r_y1": 545.29967, "r_x2": 480.59482, "r_y2": 536.5027, "r_x3": 134.76498, "r_y3": 536.5027, "coord_origin": "TOPLEFT" }, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 557.25566, "r_x1": 480.58865000000003, "r_y1": 557.25566, "r_x2": 480.58865000000003, "r_y2": 548.4586899999999, "r_x3": 134.76498, "r_y3": 548.4586899999999, "coord_origin": "TOPLEFT" }, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 569.21066, "r_x1": 480.59365999999994, "r_y1": 569.21066, "r_x2": 480.59365999999994, "r_y2": 560.4137000000001, "r_x3": 134.76498, "r_y3": 560.4137000000001, "coord_origin": "TOPLEFT" }, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 581.16566, "r_x1": 480.58673, "r_y1": 581.16566, "r_x2": 480.58673, "r_y2": 572.3687, "r_x3": 134.76498, "r_y3": 572.3687, "coord_origin": "TOPLEFT" }, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 593.12067, "r_x1": 480.59171, "r_y1": 593.12067, "r_x2": 480.59171, "r_y2": 584.3237, "r_x3": 134.76498, "r_y3": 584.3237, "coord_origin": "TOPLEFT" }, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 605.07567, "r_x1": 480.59180000000003, "r_y1": 605.07567, "r_x2": 480.59180000000003, "r_y2": 596.2787, "r_x3": 134.76498, "r_y3": 596.2787, "coord_origin": "TOPLEFT" }, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 617.03166, "r_x1": 480.5936899999999, "r_y1": 617.03166, "r_x2": 480.5936899999999, "r_y2": 608.2347, "r_x3": 134.76498, "r_y3": 608.2347, "coord_origin": "TOPLEFT" }, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 628.98666, "r_x1": 480.59072999999995, "r_y1": 628.98666, "r_x2": 480.59072999999995, "r_y2": 620.1897, "r_x3": 134.76498, "r_y3": 620.1897, "coord_origin": "TOPLEFT" }, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 640.9416699999999, "r_x1": 311.19769, "r_y1": 640.9416699999999, "r_x2": 311.19769, "r_y2": 632.1447000000001, "r_x3": 134.76498, "r_y3": 632.1447000000001, "coord_origin": "TOPLEFT" }, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The application of these rules gives OTSL a set of unique properties. First of all, the OTSL enforces a strictly rectangular structure representation, where every new-line token starts a new row. As a consequence, all rows and all columns have exactly the same number of tokens, irrespective of cell spans. Secondly, the OTSL representation is unambiguous: Every table structure is represented in one way. In this representation every table cell corresponds to a \"C\"-cell token, which in case of spans is always located in the top-left corner of the table cell definition. Third, OTSL syntax rules are only backward-looking. As a consequence, every predicted token can be validated straight during sequence generation by looking at the previously predicted sequence. As such, OTSL can guarantee that every predicted sequence is syntactically valid." }, { "label": "text", "id": 2, "page_no": 6, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76498, "t": 644.1026899999999, "r": 480.59265, "b": 664.8546699999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9590610861778259, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 652.89966, "r_x1": 480.59186, "r_y1": 652.89966, "r_x2": 480.59186, "r_y2": 644.1026899999999, "r_x3": 149.70898, "r_y3": 644.1026899999999, "coord_origin": "TOPLEFT" }, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 664.8546699999999, "r_x1": 480.59265, "r_y1": 664.8546699999999, "r_x2": 480.59265, "r_y2": 656.05769, "r_x3": 134.76498, "r_y3": 656.05769, "coord_origin": "TOPLEFT" }, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "These characteristics can be easily learned by sequence generator networks, as we demonstrate further below. We find strong indications that this pattern" } ], "body": [ { "label": "caption", "id": 6, "page_no": 6, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 134.765, "t": 125.79918999999984, "r": 480.5874, "b": 155.84966999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9333080053329468, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 133.72551999999996, "r_x1": 162.64424, "r_y1": 133.72551999999996, "r_x2": 162.64424, "r_y2": 125.79918999999984, "r_x3": 134.765, "r_y3": 125.79918999999984, "coord_origin": "TOPLEFT" }, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.276, "r_y0": 133.93169999999998, "r_x1": 480.58675999999997, "r_y1": 133.93169999999998, "r_x2": 480.58675999999997, "r_y2": 125.86200000000008, "r_x3": 166.276, "r_y3": 125.86200000000008, "coord_origin": "TOPLEFT" }, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 144.89068999999995, "r_x1": 480.5874, "r_y1": 144.89068999999995, "r_x2": 480.5874, "r_y2": 136.82097999999996, "r_x3": 134.765, "r_y3": 136.82097999999996, "coord_origin": "TOPLEFT" }, "text": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "orig": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 155.84966999999995, "r_x1": 306.1156, "r_y1": 155.84966999999995, "r_x2": 306.1156, "r_y2": 147.77997000000005, "r_x3": 134.765, "r_y3": 147.77997000000005, "coord_origin": "TOPLEFT" }, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 3. OTSL description of table structure: A - table example; B - graphical representation of table structure; C - mapping structure on a grid; D - OTSL structure encoding; E - explanation on cell encoding" }, { "label": "picture", "id": 12, "page_no": 6, "cluster": { "id": 12, "label": "picture", "bbox": { "l": 164.65028381347656, "t": 163.79708862304688, "r": 449.5505676269531, "b": 280.3409423828125, "coord_origin": "TOPLEFT" }, "confidence": 0.7868534922599792, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49326, "r_y0": 177.91540999999995, "r_x1": 381.66843, "r_y1": 177.91540999999995, "r_x2": 381.66843, "r_y2": 168.59362999999996, "r_x3": 374.49326, "r_y3": 168.59362999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74011, "r_y0": 177.82183999999995, "r_x1": 405.91528, "r_y1": 177.82183999999995, "r_x2": 405.91528, "r_y2": 168.50005999999996, "r_x3": 398.74011, "r_y3": 168.50005999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.76862, "r_y0": 202.24730999999997, "r_x1": 380.94379, "r_y1": 202.24730999999997, "r_x2": 380.94379, "r_y2": 192.92553999999996, "r_x3": 373.76862, "r_y3": 192.92553999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66388, "r_y0": 202.39239999999995, "r_x1": 393.83905, "r_y1": 202.39239999999995, "r_x2": 393.83905, "r_y2": 193.07061999999996, "r_x3": 386.66388, "r_y3": 193.07061999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.68707, "r_y0": 214.45934999999997, "r_x1": 393.86224, "r_y1": 214.45934999999997, "r_x2": 393.86224, "r_y2": 205.13756999999998, "r_x3": 386.68707, "r_y3": 205.13756999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.65729, "r_y0": 190.05457, "r_x1": 405.83246, "r_y1": 190.05457, "r_x2": 405.83246, "r_y2": 180.73279000000002, "r_x3": 398.65729, "r_y3": 180.73279000000002, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.77908, "r_y0": 190.06035999999995, "r_x1": 417.95425, "r_y1": 190.06035999999995, "r_x2": 417.95425, "r_y2": 180.73859000000004, "r_x3": 410.77908, "r_y3": 180.73859000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.90503, "r_y0": 189.97424, "r_x1": 430.08020000000005, "r_y1": 189.97424, "r_x2": 430.08020000000005, "r_y2": 180.65247, "r_x3": 422.90503, "r_y3": 180.65247, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7807, "r_y0": 202.31042000000002, "r_x1": 405.95587, "r_y1": 202.31042000000002, "r_x2": 405.95587, "r_y2": 192.98865, "r_x3": 398.7807, "r_y3": 192.98865, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90164, "r_y0": 202.31664999999998, "r_x1": 418.07681, "r_y1": 202.31664999999998, "r_x2": 418.07681, "r_y2": 192.99487, "r_x3": 410.90164, "r_y3": 192.99487, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.02753, "r_y0": 202.23077, "r_x1": 430.2027, "r_y1": 202.23077, "r_x2": 430.2027, "r_y2": 192.909, "r_x3": 423.02753, "r_y3": 192.909, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78235, "r_y0": 214.63751000000002, "r_x1": 405.95752, "r_y1": 214.63751000000002, "r_x2": 405.95752, "r_y2": 205.31573000000003, "r_x3": 398.78235, "r_y3": 205.31573000000003, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90414, "r_y0": 214.64373999999998, "r_x1": 418.07932, "r_y1": 214.64373999999998, "r_x2": 418.07932, "r_y2": 205.32196, "r_x3": 410.90414, "r_y3": 205.32196, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03003, "r_y0": 214.55791999999997, "r_x1": 430.20520000000005, "r_y1": 214.55791999999997, "r_x2": 430.20520000000005, "r_y2": 205.23614999999995, "r_x3": 423.03003, "r_y3": 205.23614999999995, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.50574, "r_y0": 226.36059999999998, "r_x1": 393.68091, "r_y1": 226.36059999999998, "r_x2": 393.68091, "r_y2": 217.03882, "r_x3": 386.50574, "r_y3": 217.03882, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.60181, "r_y0": 226.53882, "r_x1": 405.77698, "r_y1": 226.53882, "r_x2": 405.77698, "r_y2": 217.21704, "r_x3": 398.60181, "r_y3": 217.21704, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72275, "r_y0": 226.54498, "r_x1": 417.89792, "r_y1": 226.54498, "r_x2": 417.89792, "r_y2": 217.22321, "r_x3": 410.72275, "r_y3": 217.22321, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.84869, "r_y0": 226.45916999999997, "r_x1": 430.02386, "r_y1": 226.45916999999997, "r_x2": 430.02386, "r_y2": 217.13738999999998, "r_x3": 422.84869, "r_y3": 217.13738999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16009999999994, "r_y0": 177.01189999999997, "r_x1": 447.86273, "r_y1": 177.01189999999997, "r_x2": 447.86273, "r_y2": 167.69011999999998, "r_x3": 435.16009999999994, "r_y3": 167.69011999999998, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44415, "r_y0": 189.52202999999997, "r_x1": 448.14679, "r_y1": 189.52202999999997, "r_x2": 448.14679, "r_y2": 180.20025999999996, "r_x3": 435.44415, "r_y3": 180.20025999999996, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.46735, "r_y0": 201.81652999999994, "r_x1": 448.16998000000007, "r_y1": 201.81652999999994, "r_x2": 448.16998000000007, "r_y2": 192.49474999999995, "r_x3": 435.46735, "r_y3": 192.49474999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38202, "r_y0": 214.15204000000006, "r_x1": 448.08466, "r_y1": 214.15204000000006, "r_x2": 448.08466, "r_y2": 204.83025999999995, "r_x3": 435.38202, "r_y3": 204.83025999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.59906, "r_y0": 226.55548, "r_x1": 448.3017, "r_y1": 226.55548, "r_x2": 448.3017, "r_y2": 217.2337, "r_x3": 435.59906, "r_y3": 217.2337, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.14957, "r_y0": 214.55669999999998, "r_x1": 381.32474, "r_y1": 214.55669999999998, "r_x2": 381.32474, "r_y2": 205.23492, "r_x3": 374.14957, "r_y3": 205.23492, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0419, "r_y0": 226.46826, "r_x1": 381.21707, "r_y1": 226.46826, "r_x2": 381.21707, "r_y2": 217.14648, "r_x3": 374.0419, "r_y3": 217.14648, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34418, "r_y0": 190.25665000000004, "r_x1": 381.51935, "r_y1": 190.25665000000004, "r_x2": 381.51935, "r_y2": 180.93488000000002, "r_x3": 374.34418, "r_y3": 180.93488000000002, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76285, "r_y0": 177.89966000000004, "r_x1": 393.28833, "r_y1": 177.89966000000004, "r_x2": 393.28833, "r_y2": 168.57788000000005, "r_x3": 387.76285, "r_y3": 168.57788000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86395, "r_y0": 177.38373, "r_x1": 417.38943, "r_y1": 177.38373, "r_x2": 417.38943, "r_y2": 168.06195000000002, "r_x3": 411.86395, "r_y3": 168.06195000000002, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.33563, "r_y0": 177.25616000000002, "r_x1": 428.86111, "r_y1": 177.25616000000002, "r_x2": 428.86111, "r_y2": 167.93439, "r_x3": 423.33563, "r_y3": 167.93439, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.13593, "r_y0": 190.10753999999997, "r_x1": 393.76453, "r_y1": 190.10753999999997, "r_x2": 393.76453, "r_y2": 180.78576999999996, "r_x3": 387.13593, "r_y3": 180.78576999999996, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.2594, "r_y0": 253.83056999999997, "r_x1": 289.43457, "r_y1": 253.83056999999997, "r_x2": 289.43457, "r_y2": 244.50878999999998, "r_x3": 282.2594, "r_y3": 244.50878999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11035, "r_y0": 266.172, "r_x1": 289.28552, "r_y1": 266.172, "r_x2": 289.28552, "r_y2": 256.85022000000004, "r_x3": 282.11035, "r_y3": 256.85022000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.40848, "r_y0": 278.45477000000005, "r_x1": 289.58365, "r_y1": 278.45477000000005, "r_x2": 289.58365, "r_y2": 269.13300000000004, "r_x3": 282.40848, "r_y3": 269.13300000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.52902, "r_y0": 253.81525, "r_x1": 301.0545, "r_y1": 253.81525, "r_x2": 301.0545, "r_y2": 244.49347, "r_x3": 295.52902, "r_y3": 244.49347, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.46613, "r_y0": 253.89550999999994, "r_x1": 312.99161, "r_y1": 253.89550999999994, "r_x2": 312.99161, "r_y2": 244.57372999999995, "r_x3": 307.46613, "r_y3": 244.57372999999995, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.76886, "r_y0": 253.76215000000002, "r_x1": 324.29434, "r_y1": 253.76215000000002, "r_x2": 324.29434, "r_y2": 244.44037000000003, "r_x3": 318.76886, "r_y3": 244.44037000000003, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9021, "r_y0": 266.02332, "r_x1": 301.03976, "r_y1": 266.02332, "r_x2": 301.03976, "r_y2": 256.70154, "r_x3": 294.9021, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.17743, "r_y0": 266.02332, "r_x1": 325.59039, "r_y1": 266.02332, "r_x2": 325.59039, "r_y2": 256.70154, "r_x3": 307.17743, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.78949, "r_y0": 278.57599000000005, "r_x1": 300.92715, "r_y1": 278.57599000000005, "r_x2": 300.92715, "r_y2": 269.25420999999994, "r_x3": 294.78949, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06482, "r_y0": 278.57599000000005, "r_x1": 325.47778, "r_y1": 278.57599000000005, "r_x2": 325.47778, "r_y2": 269.25420999999994, "r_x3": 307.06482, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.93939, "r_y0": 278.06976, "r_x1": 203.11456, "r_y1": 278.06976, "r_x2": 203.11456, "r_y2": 268.74798999999996, "r_x3": 195.93939, "r_y3": 268.74798999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.20891, "r_y0": 278.05444, "r_x1": 214.73439, "r_y1": 278.05444, "r_x2": 214.73439, "r_y2": 268.73267, "r_x3": 209.20891, "r_y3": 268.73267, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.14551, "r_y0": 278.13469999999995, "r_x1": 226.67099, "r_y1": 278.13469999999995, "r_x2": 226.67099, "r_y2": 268.81293000000005, "r_x3": 221.14551, "r_y3": 268.81293000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.44858, "r_y0": 278.00134, "r_x1": 237.97405999999998, "r_y1": 278.00134, "r_x2": 237.97405999999998, "r_y2": 268.67957, "r_x3": 232.44858, "r_y3": 268.67957, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.21715, "r_y0": 253.86139000000003, "r_x1": 203.39232, "r_y1": 253.86139000000003, "r_x2": 203.39232, "r_y2": 244.53961000000004, "r_x3": 196.21715, "r_y3": 244.53961000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32143, "r_y0": 253.41992000000005, "r_x1": 257.49661, "r_y1": 253.41992000000005, "r_x2": 257.49661, "r_y2": 244.09813999999994, "r_x3": 250.32143, "r_y3": 244.09813999999994, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17235999999997, "r_y0": 265.76129000000003, "r_x1": 257.34753, "r_y1": 265.76129000000003, "r_x2": 257.34753, "r_y2": 256.43951000000004, "r_x3": 250.17235999999997, "r_y3": 256.43951000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47049000000004, "r_y0": 278.04400999999996, "r_x1": 257.64566, "r_y1": 278.04400999999996, "r_x2": 257.64566, "r_y2": 268.72222999999997, "r_x3": 250.47049000000004, "r_y3": 268.72222999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 249.20911, "r_x1": 337.22485, "r_y1": 249.20911, "r_x2": 337.22485, "r_y2": 242.99463000000003, "r_x3": 334.51135, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.93835, "r_y0": 249.20911, "r_x1": 391.49472, "r_y1": 249.20911, "r_x2": 391.49472, "r_y2": 242.99463000000003, "r_x3": 339.93835, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 259.14703, "r_x1": 337.33313, "r_y1": 259.14703, "r_x2": 337.33313, "r_y2": 252.93255999999997, "r_x3": 334.51135, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15491, "r_y0": 259.14703, "r_x1": 421.98624, "r_y1": 259.14703, "r_x2": 421.98624, "r_y2": 252.93255999999997, "r_x3": 340.15491, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 269.08496, "r_x1": 337.29868, "r_y1": 269.08496, "r_x2": 337.29868, "r_y2": 262.87048000000004, "r_x3": 334.51135, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.086, "r_y0": 269.08496, "r_x1": 415.34375, "r_y1": 269.08496, "r_x2": 415.34375, "r_y2": 262.87048000000004, "r_x3": 340.086, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 279.02288999999996, "r_x1": 337.30188, "r_y1": 279.02288999999996, "r_x2": 337.30188, "r_y2": 272.80841, "r_x3": 334.51135, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09241, "r_y0": 279.02288999999996, "r_x1": 426.59875, "r_y1": 279.02288999999996, "r_x2": 426.59875, "r_y2": 272.80841, "r_x3": 340.09241, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67178, "r_y0": 250.25671, "r_x1": 189.35544, "r_y1": 250.25671, "r_x2": 189.35544, "r_y2": 244.04224, "r_x3": 185.67178, "r_y3": 244.04224, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.96759, "r_y0": 274.56213, "r_x1": 189.65125, "r_y1": 274.56213, "r_x2": 189.65125, "r_y2": 268.34766, "r_x3": 185.96759, "r_y3": 268.34766, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34152, "r_y0": 249.83972000000006, "r_x1": 243.02518, "r_y1": 249.83972000000006, "r_x2": 243.02518, "r_y2": 243.62523999999996, "r_x3": 239.34152, "r_y3": 243.62523999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.32852, "r_y0": 249.70836999999995, "r_x1": 275.01218, "r_y1": 249.70836999999995, "r_x2": 275.01218, "r_y2": 243.49390000000005, "r_x3": 271.32852, "r_y3": 243.49390000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.81627, "r_y0": 172.72942999999998, "r_x1": 233.49992000000003, "r_y1": 172.72942999999998, "r_x2": 233.49992000000003, "r_y2": 166.51495, "r_x3": 229.81627, "r_y3": 166.51495, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24402, "r_y0": 196.17548, "r_x1": 260.92767, "r_y1": 196.17548, "r_x2": 260.92767, "r_y2": 189.961, "r_x3": 257.24402, "r_y3": 189.961, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.87526, "r_y0": 184.19115999999997, "r_x1": 190.55891, "r_y1": 184.19115999999997, "r_x2": 190.55891, "r_y2": 177.97668, "r_x3": 186.87526, "r_y3": 177.97668, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.48746, "r_y0": 175.22968000000003, "r_x1": 200.17111, "r_y1": 175.22968000000003, "r_x2": 200.17111, "r_y2": 169.01520000000005, "r_x3": 196.48746, "r_y3": 169.01520000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 175.65039000000002, "r_x1": 175.72659, "r_y1": 175.65039000000002, "r_x2": 175.72659, "r_y2": 167.88225999999997, "r_x3": 169.74728, "r_y3": 167.88225999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 214.60681, "r_x1": 175.72659, "r_y1": 214.60681, "r_x2": 175.72659, "r_y2": 206.83867999999995, "r_x3": 169.74728, "r_y3": 206.83867999999995, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29419, "r_y0": 176.04785000000004, "r_x1": 280.2735, "r_y1": 176.04785000000004, "r_x2": 280.2735, "r_y2": 168.27972, "r_x3": 274.29419, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56152, "r_y0": 176.04785000000004, "r_x1": 365.54083, "r_y1": 176.04785000000004, "r_x2": 365.54083, "r_y2": 168.27972, "r_x3": 359.56152, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 250.97960999999998, "r_x1": 175.27112, "r_y1": 250.97960999999998, "r_x2": 175.27112, "r_y2": 243.21149000000003, "r_x3": 169.74728, "r_y3": 243.21149000000003, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 38, "label": "text", "bbox": { "l": 374.49326, "t": 168.59362999999996, "r": 381.66843, "b": 177.91540999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49326, "r_y0": 177.91540999999995, "r_x1": 381.66843, "r_y1": 177.91540999999995, "r_x2": 381.66843, "r_y2": 168.59362999999996, "r_x3": 374.49326, "r_y3": 168.59362999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 398.74011, "t": 168.50005999999996, "r": 405.91528, "b": 177.82183999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74011, "r_y0": 177.82183999999995, "r_x1": 405.91528, "r_y1": 177.82183999999995, "r_x2": 405.91528, "r_y2": 168.50005999999996, "r_x3": 398.74011, "r_y3": 168.50005999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 373.76862, "t": 192.92553999999996, "r": 380.94379, "b": 202.24730999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.76862, "r_y0": 202.24730999999997, "r_x1": 380.94379, "r_y1": 202.24730999999997, "r_x2": 380.94379, "r_y2": 192.92553999999996, "r_x3": 373.76862, "r_y3": 192.92553999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 386.66388, "t": 193.07061999999996, "r": 393.83905, "b": 202.39239999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66388, "r_y0": 202.39239999999995, "r_x1": 393.83905, "r_y1": 202.39239999999995, "r_x2": 393.83905, "r_y2": 193.07061999999996, "r_x3": 386.66388, "r_y3": 193.07061999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 386.68707, "t": 205.13756999999998, "r": 393.86224, "b": 214.45934999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.68707, "r_y0": 214.45934999999997, "r_x1": 393.86224, "r_y1": 214.45934999999997, "r_x2": 393.86224, "r_y2": 205.13756999999998, "r_x3": 386.68707, "r_y3": 205.13756999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 398.65729, "t": 180.73279000000002, "r": 405.83246, "b": 190.05457, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.65729, "r_y0": 190.05457, "r_x1": 405.83246, "r_y1": 190.05457, "r_x2": 405.83246, "r_y2": 180.73279000000002, "r_x3": 398.65729, "r_y3": 180.73279000000002, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 410.77908, "t": 180.73859000000004, "r": 417.95425, "b": 190.06035999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.77908, "r_y0": 190.06035999999995, "r_x1": 417.95425, "r_y1": 190.06035999999995, "r_x2": 417.95425, "r_y2": 180.73859000000004, "r_x3": 410.77908, "r_y3": 180.73859000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 422.90503, "t": 180.65247, "r": 430.08020000000005, "b": 189.97424, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.90503, "r_y0": 189.97424, "r_x1": 430.08020000000005, "r_y1": 189.97424, "r_x2": 430.08020000000005, "r_y2": 180.65247, "r_x3": 422.90503, "r_y3": 180.65247, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 398.7807, "t": 192.98865, "r": 405.95587, "b": 202.31042000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7807, "r_y0": 202.31042000000002, "r_x1": 405.95587, "r_y1": 202.31042000000002, "r_x2": 405.95587, "r_y2": 192.98865, "r_x3": 398.7807, "r_y3": 192.98865, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 410.90164, "t": 192.99487, "r": 418.07681, "b": 202.31664999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90164, "r_y0": 202.31664999999998, "r_x1": 418.07681, "r_y1": 202.31664999999998, "r_x2": 418.07681, "r_y2": 192.99487, "r_x3": 410.90164, "r_y3": 192.99487, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 423.02753, "t": 192.909, "r": 430.2027, "b": 202.23077, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.02753, "r_y0": 202.23077, "r_x1": 430.2027, "r_y1": 202.23077, "r_x2": 430.2027, "r_y2": 192.909, "r_x3": 423.02753, "r_y3": 192.909, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 398.78235, "t": 205.31573000000003, "r": 405.95752, "b": 214.63751000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78235, "r_y0": 214.63751000000002, "r_x1": 405.95752, "r_y1": 214.63751000000002, "r_x2": 405.95752, "r_y2": 205.31573000000003, "r_x3": 398.78235, "r_y3": 205.31573000000003, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 410.90414, "t": 205.32196, "r": 418.07932, "b": 214.64373999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.90414, "r_y0": 214.64373999999998, "r_x1": 418.07932, "r_y1": 214.64373999999998, "r_x2": 418.07932, "r_y2": 205.32196, "r_x3": 410.90414, "r_y3": 205.32196, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 423.03003, "t": 205.23614999999995, "r": 430.20520000000005, "b": 214.55791999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03003, "r_y0": 214.55791999999997, "r_x1": 430.20520000000005, "r_y1": 214.55791999999997, "r_x2": 430.20520000000005, "r_y2": 205.23614999999995, "r_x3": 423.03003, "r_y3": 205.23614999999995, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 386.50574, "t": 217.03882, "r": 393.68091, "b": 226.36059999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.50574, "r_y0": 226.36059999999998, "r_x1": 393.68091, "r_y1": 226.36059999999998, "r_x2": 393.68091, "r_y2": 217.03882, "r_x3": 386.50574, "r_y3": 217.03882, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 398.60181, "t": 217.21704, "r": 405.77698, "b": 226.53882, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.60181, "r_y0": 226.53882, "r_x1": 405.77698, "r_y1": 226.53882, "r_x2": 405.77698, "r_y2": 217.21704, "r_x3": 398.60181, "r_y3": 217.21704, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 410.72275, "t": 217.22321, "r": 417.89792, "b": 226.54498, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72275, "r_y0": 226.54498, "r_x1": 417.89792, "r_y1": 226.54498, "r_x2": 417.89792, "r_y2": 217.22321, "r_x3": 410.72275, "r_y3": 217.22321, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 422.84869, "t": 217.13738999999998, "r": 430.02386, "b": 226.45916999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.84869, "r_y0": 226.45916999999997, "r_x1": 430.02386, "r_y1": 226.45916999999997, "r_x2": 430.02386, "r_y2": 217.13738999999998, "r_x3": 422.84869, "r_y3": 217.13738999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 435.16009999999994, "t": 167.69011999999998, "r": 447.86273, "b": 177.01189999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16009999999994, "r_y0": 177.01189999999997, "r_x1": 447.86273, "r_y1": 177.01189999999997, "r_x2": 447.86273, "r_y2": 167.69011999999998, "r_x3": 435.16009999999994, "r_y3": 167.69011999999998, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 435.44415, "t": 180.20025999999996, "r": 448.14679, "b": 189.52202999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44415, "r_y0": 189.52202999999997, "r_x1": 448.14679, "r_y1": 189.52202999999997, "r_x2": 448.14679, "r_y2": 180.20025999999996, "r_x3": 435.44415, "r_y3": 180.20025999999996, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 435.46735, "t": 192.49474999999995, "r": 448.16998000000007, "b": 201.81652999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.46735, "r_y0": 201.81652999999994, "r_x1": 448.16998000000007, "r_y1": 201.81652999999994, "r_x2": 448.16998000000007, "r_y2": 192.49474999999995, "r_x3": 435.46735, "r_y3": 192.49474999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 435.38202, "t": 204.83025999999995, "r": 448.08466, "b": 214.15204000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38202, "r_y0": 214.15204000000006, "r_x1": 448.08466, "r_y1": 214.15204000000006, "r_x2": 448.08466, "r_y2": 204.83025999999995, "r_x3": 435.38202, "r_y3": 204.83025999999995, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 435.59906, "t": 217.2337, "r": 448.3017, "b": 226.55548, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.59906, "r_y0": 226.55548, "r_x1": 448.3017, "r_y1": 226.55548, "r_x2": 448.3017, "r_y2": 217.2337, "r_x3": 435.59906, "r_y3": 217.2337, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 374.14957, "t": 205.23492, "r": 381.32474, "b": 214.55669999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.14957, "r_y0": 214.55669999999998, "r_x1": 381.32474, "r_y1": 214.55669999999998, "r_x2": 381.32474, "r_y2": 205.23492, "r_x3": 374.14957, "r_y3": 205.23492, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 374.0419, "t": 217.14648, "r": 381.21707, "b": 226.46826, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0419, "r_y0": 226.46826, "r_x1": 381.21707, "r_y1": 226.46826, "r_x2": 381.21707, "r_y2": 217.14648, "r_x3": 374.0419, "r_y3": 217.14648, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 374.34418, "t": 180.93488000000002, "r": 381.51935, "b": 190.25665000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34418, "r_y0": 190.25665000000004, "r_x1": 381.51935, "r_y1": 190.25665000000004, "r_x2": 381.51935, "r_y2": 180.93488000000002, "r_x3": 374.34418, "r_y3": 180.93488000000002, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 387.76285, "t": 168.57788000000005, "r": 393.28833, "b": 177.89966000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76285, "r_y0": 177.89966000000004, "r_x1": 393.28833, "r_y1": 177.89966000000004, "r_x2": 393.28833, "r_y2": 168.57788000000005, "r_x3": 387.76285, "r_y3": 168.57788000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 411.86395, "t": 168.06195000000002, "r": 417.38943, "b": 177.38373, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86395, "r_y0": 177.38373, "r_x1": 417.38943, "r_y1": 177.38373, "r_x2": 417.38943, "r_y2": 168.06195000000002, "r_x3": 411.86395, "r_y3": 168.06195000000002, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 423.33563, "t": 167.93439, "r": 428.86111, "b": 177.25616000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.33563, "r_y0": 177.25616000000002, "r_x1": 428.86111, "r_y1": 177.25616000000002, "r_x2": 428.86111, "r_y2": 167.93439, "r_x3": 423.33563, "r_y3": 167.93439, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 387.13593, "t": 180.78576999999996, "r": 393.76453, "b": 190.10753999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.13593, "r_y0": 190.10753999999997, "r_x1": 393.76453, "r_y1": 190.10753999999997, "r_x2": 393.76453, "r_y2": 180.78576999999996, "r_x3": 387.13593, "r_y3": 180.78576999999996, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 282.2594, "t": 244.50878999999998, "r": 289.43457, "b": 253.83056999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.2594, "r_y0": 253.83056999999997, "r_x1": 289.43457, "r_y1": 253.83056999999997, "r_x2": 289.43457, "r_y2": 244.50878999999998, "r_x3": 282.2594, "r_y3": 244.50878999999998, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 282.11035, "t": 256.85022000000004, "r": 289.28552, "b": 266.172, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11035, "r_y0": 266.172, "r_x1": 289.28552, "r_y1": 266.172, "r_x2": 289.28552, "r_y2": 256.85022000000004, "r_x3": 282.11035, "r_y3": 256.85022000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 282.40848, "t": 269.13300000000004, "r": 289.58365, "b": 278.45477000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.40848, "r_y0": 278.45477000000005, "r_x1": 289.58365, "r_y1": 278.45477000000005, "r_x2": 289.58365, "r_y2": 269.13300000000004, "r_x3": 282.40848, "r_y3": 269.13300000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 295.52902, "t": 244.49347, "r": 301.0545, "b": 253.81525, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.52902, "r_y0": 253.81525, "r_x1": 301.0545, "r_y1": 253.81525, "r_x2": 301.0545, "r_y2": 244.49347, "r_x3": 295.52902, "r_y3": 244.49347, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 307.46613, "t": 244.57372999999995, "r": 312.99161, "b": 253.89550999999994, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.46613, "r_y0": 253.89550999999994, "r_x1": 312.99161, "r_y1": 253.89550999999994, "r_x2": 312.99161, "r_y2": 244.57372999999995, "r_x3": 307.46613, "r_y3": 244.57372999999995, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 318.76886, "t": 244.44037000000003, "r": 324.29434, "b": 253.76215000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.76886, "r_y0": 253.76215000000002, "r_x1": 324.29434, "r_y1": 253.76215000000002, "r_x2": 324.29434, "r_y2": 244.44037000000003, "r_x3": 318.76886, "r_y3": 244.44037000000003, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 294.9021, "t": 256.70154, "r": 301.03976, "b": 266.02332, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9021, "r_y0": 266.02332, "r_x1": 301.03976, "r_y1": 266.02332, "r_x2": 301.03976, "r_y2": 256.70154, "r_x3": 294.9021, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 307.17743, "t": 256.70154, "r": 325.59039, "b": 266.02332, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.17743, "r_y0": 266.02332, "r_x1": 325.59039, "r_y1": 266.02332, "r_x2": 325.59039, "r_y2": 256.70154, "r_x3": 307.17743, "r_y3": 256.70154, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 294.78949, "t": 269.25420999999994, "r": 300.92715, "b": 278.57599000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.78949, "r_y0": 278.57599000000005, "r_x1": 300.92715, "r_y1": 278.57599000000005, "r_x2": 300.92715, "r_y2": 269.25420999999994, "r_x3": 294.78949, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 307.06482, "t": 269.25420999999994, "r": 325.47778, "b": 278.57599000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06482, "r_y0": 278.57599000000005, "r_x1": 325.47778, "r_y1": 278.57599000000005, "r_x2": 325.47778, "r_y2": 269.25420999999994, "r_x3": 307.06482, "r_y3": 269.25420999999994, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 195.93939, "t": 268.74798999999996, "r": 203.11456, "b": 278.06976, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.93939, "r_y0": 278.06976, "r_x1": 203.11456, "r_y1": 278.06976, "r_x2": 203.11456, "r_y2": 268.74798999999996, "r_x3": 195.93939, "r_y3": 268.74798999999996, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 209.20891, "t": 268.73267, "r": 214.73439, "b": 278.05444, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.20891, "r_y0": 278.05444, "r_x1": 214.73439, "r_y1": 278.05444, "r_x2": 214.73439, "r_y2": 268.73267, "r_x3": 209.20891, "r_y3": 268.73267, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 221.14551, "t": 268.81293000000005, "r": 226.67099, "b": 278.13469999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.14551, "r_y0": 278.13469999999995, "r_x1": 226.67099, "r_y1": 278.13469999999995, "r_x2": 226.67099, "r_y2": 268.81293000000005, "r_x3": 221.14551, "r_y3": 268.81293000000005, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.44858, "t": 268.67957, "r": 237.97405999999998, "b": 278.00134, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.44858, "r_y0": 278.00134, "r_x1": 237.97405999999998, "r_y1": 278.00134, "r_x2": 237.97405999999998, "r_y2": 268.67957, "r_x3": 232.44858, "r_y3": 268.67957, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 196.21715, "t": 244.53961000000004, "r": 203.39232, "b": 253.86139000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.21715, "r_y0": 253.86139000000003, "r_x1": 203.39232, "r_y1": 253.86139000000003, "r_x2": 203.39232, "r_y2": 244.53961000000004, "r_x3": 196.21715, "r_y3": 244.53961000000004, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 250.32143, "t": 244.09813999999994, "r": 257.49661, "b": 253.41992000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32143, "r_y0": 253.41992000000005, "r_x1": 257.49661, "r_y1": 253.41992000000005, "r_x2": 257.49661, "r_y2": 244.09813999999994, "r_x3": 250.32143, "r_y3": 244.09813999999994, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 250.17235999999997, "t": 256.43951000000004, "r": 257.34753, "b": 265.76129000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17235999999997, "r_y0": 265.76129000000003, "r_x1": 257.34753, "r_y1": 265.76129000000003, "r_x2": 257.34753, "r_y2": 256.43951000000004, "r_x3": 250.17235999999997, "r_y3": 256.43951000000004, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 250.47049000000004, "t": 268.72222999999997, "r": 257.64566, "b": 278.04400999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47049000000004, "r_y0": 278.04400999999996, "r_x1": 257.64566, "r_y1": 278.04400999999996, "r_x2": 257.64566, "r_y2": 268.72222999999997, "r_x3": 250.47049000000004, "r_y3": 268.72222999999997, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 334.51135, "t": 242.99463000000003, "r": 337.22485, "b": 249.20911, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 249.20911, "r_x1": 337.22485, "r_y1": 249.20911, "r_x2": 337.22485, "r_y2": 242.99463000000003, "r_x3": 334.51135, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 339.93835, "t": 242.99463000000003, "r": 391.49472, "b": 249.20911, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.93835, "r_y0": 249.20911, "r_x1": 391.49472, "r_y1": 249.20911, "r_x2": 391.49472, "r_y2": 242.99463000000003, "r_x3": 339.93835, "r_y3": 242.99463000000003, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 334.51135, "t": 252.93255999999997, "r": 337.33313, "b": 259.14703, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 259.14703, "r_x1": 337.33313, "r_y1": 259.14703, "r_x2": 337.33313, "r_y2": 252.93255999999997, "r_x3": 334.51135, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 340.15491, "t": 252.93255999999997, "r": 421.98624, "b": 259.14703, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15491, "r_y0": 259.14703, "r_x1": 421.98624, "r_y1": 259.14703, "r_x2": 421.98624, "r_y2": 252.93255999999997, "r_x3": 340.15491, "r_y3": 252.93255999999997, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 334.51135, "t": 262.87048000000004, "r": 337.29868, "b": 269.08496, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 269.08496, "r_x1": 337.29868, "r_y1": 269.08496, "r_x2": 337.29868, "r_y2": 262.87048000000004, "r_x3": 334.51135, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 340.086, "t": 262.87048000000004, "r": 415.34375, "b": 269.08496, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.086, "r_y0": 269.08496, "r_x1": 415.34375, "r_y1": 269.08496, "r_x2": 415.34375, "r_y2": 262.87048000000004, "r_x3": 340.086, "r_y3": 262.87048000000004, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 334.51135, "t": 272.80841, "r": 426.59875, "b": 279.02288999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.5250625610351562, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51135, "r_y0": 279.02288999999996, "r_x1": 337.30188, "r_y1": 279.02288999999996, "r_x2": 337.30188, "r_y2": 272.80841, "r_x3": 334.51135, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09241, "r_y0": 279.02288999999996, "r_x1": 426.59875, "r_y1": 279.02288999999996, "r_x2": 426.59875, "r_y2": 272.80841, "r_x3": 340.09241, "r_y3": 272.80841, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 185.67178, "t": 244.04224, "r": 189.35544, "b": 250.25671, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67178, "r_y0": 250.25671, "r_x1": 189.35544, "r_y1": 250.25671, "r_x2": 189.35544, "r_y2": 244.04224, "r_x3": 185.67178, "r_y3": 244.04224, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 185.96759, "t": 268.34766, "r": 189.65125, "b": 274.56213, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.96759, "r_y0": 274.56213, "r_x1": 189.65125, "r_y1": 274.56213, "r_x2": 189.65125, "r_y2": 268.34766, "r_x3": 185.96759, "r_y3": 268.34766, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 239.34152, "t": 243.62523999999996, "r": 243.02518, "b": 249.83972000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34152, "r_y0": 249.83972000000006, "r_x1": 243.02518, "r_y1": 249.83972000000006, "r_x2": 243.02518, "r_y2": 243.62523999999996, "r_x3": 239.34152, "r_y3": 243.62523999999996, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 271.32852, "t": 243.49390000000005, "r": 275.01218, "b": 249.70836999999995, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.32852, "r_y0": 249.70836999999995, "r_x1": 275.01218, "r_y1": 249.70836999999995, "r_x2": 275.01218, "r_y2": 243.49390000000005, "r_x3": 271.32852, "r_y3": 243.49390000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 229.81627, "t": 166.51495, "r": 233.49992000000003, "b": 172.72942999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.81627, "r_y0": 172.72942999999998, "r_x1": 233.49992000000003, "r_y1": 172.72942999999998, "r_x2": 233.49992000000003, "r_y2": 166.51495, "r_x3": 229.81627, "r_y3": 166.51495, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 257.24402, "t": 189.961, "r": 260.92767, "b": 196.17548, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24402, "r_y0": 196.17548, "r_x1": 260.92767, "r_y1": 196.17548, "r_x2": 260.92767, "r_y2": 189.961, "r_x3": 257.24402, "r_y3": 189.961, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 186.87526, "t": 177.97668, "r": 190.55891, "b": 184.19115999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.87526, "r_y0": 184.19115999999997, "r_x1": 190.55891, "r_y1": 184.19115999999997, "r_x2": 190.55891, "r_y2": 177.97668, "r_x3": 186.87526, "r_y3": 177.97668, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 196.48746, "t": 169.01520000000005, "r": 200.17111, "b": 175.22968000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.48746, "r_y0": 175.22968000000003, "r_x1": 200.17111, "r_y1": 175.22968000000003, "r_x2": 200.17111, "r_y2": 169.01520000000005, "r_x3": 196.48746, "r_y3": 169.01520000000005, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 169.74728, "t": 167.88225999999997, "r": 175.72659, "b": 175.65039000000002, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 175.65039000000002, "r_x1": 175.72659, "r_y1": 175.65039000000002, "r_x2": 175.72659, "r_y2": 167.88225999999997, "r_x3": 169.74728, "r_y3": 167.88225999999997, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 169.74728, "t": 206.83867999999995, "r": 175.72659, "b": 214.60681, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 214.60681, "r_x1": 175.72659, "r_y1": 214.60681, "r_x2": 175.72659, "r_y2": 206.83867999999995, "r_x3": 169.74728, "r_y3": 206.83867999999995, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 274.29419, "t": 168.27972, "r": 280.2735, "b": 176.04785000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29419, "r_y0": 176.04785000000004, "r_x1": 280.2735, "r_y1": 176.04785000000004, "r_x2": 280.2735, "r_y2": 168.27972, "r_x3": 274.29419, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 359.56152, "t": 168.27972, "r": 365.54083, "b": 176.04785000000004, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56152, "r_y0": 176.04785000000004, "r_x1": 365.54083, "r_y1": 176.04785000000004, "r_x2": 365.54083, "r_y2": 168.27972, "r_x3": 359.56152, "r_y3": 168.27972, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 169.74728, "t": 243.21149000000003, "r": 175.27112, "b": 250.97960999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.74728, "r_y0": 250.97960999999998, "r_x1": 175.27112, "r_y1": 250.97960999999998, "r_x2": 175.27112, "r_y2": 243.21149000000003, "r_x3": 169.74728, "r_y3": 243.21149000000003, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "section_header", "id": 9, "page_no": 6, "cluster": { "id": 9, "label": "section_header", "bbox": { "l": 134.765, "t": 305.29581, "r": 246.65197999999998, "b": 314.10275, "coord_origin": "TOPLEFT" }, "confidence": 0.9233023524284363, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 314.10275, "r_x1": 149.40205, "r_y1": 314.10275, "r_x2": 149.40205, "r_y2": 305.29581, "r_x3": 134.765, "r_y3": 305.29581, "coord_origin": "TOPLEFT" }, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 314.10275, "r_x1": 246.65197999999998, "r_y1": 314.10275, "r_x2": 246.65197999999998, "r_y2": 305.29581, "r_x3": 160.85904, "r_y3": 305.29581, "coord_origin": "TOPLEFT" }, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.2 Language Syntax" }, { "label": "text", "id": 10, "page_no": 6, "cluster": { "id": 10, "label": "text", "bbox": { "l": 134.765, "t": 325.24777, "r": 363.79617, "b": 334.04474, "coord_origin": "TOPLEFT" }, "confidence": 0.9169168472290039, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 334.04474, "r_x1": 363.79617, "r_y1": 334.04474, "r_x2": 363.79617, "r_y2": 325.24777, "r_x3": 134.765, "r_y3": 325.24777, "coord_origin": "TOPLEFT" }, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The OTSL representation follows these syntax rules:" }, { "label": "list_item", "id": 3, "page_no": 6, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 138.97299, "t": 347.17081, "r": 480.58902, "b": 367.93375, "coord_origin": "TOPLEFT" }, "confidence": 0.9588112235069275, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 355.97775, "r_x1": 146.71991, "r_y1": 355.97775, "r_x2": 146.71991, "r_y2": 347.18079, "r_x3": 138.97299, "r_y3": 347.18079, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 355.97775, "r_x1": 257.37927, "r_y1": 355.97775, "r_x2": 257.37927, "r_y2": 347.17081, "r_x3": 151.70099, "r_y3": 347.17081, "coord_origin": "TOPLEFT" }, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.383, "r_y0": 355.97775, "r_x1": 480.58902, "r_y1": 355.97775, "r_x2": 480.58902, "r_y2": 347.18079, "r_x3": 257.383, "r_y3": 347.18079, "coord_origin": "TOPLEFT" }, "text": ": The left neighbour of an \"L\" cell must be either", "orig": ": The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 367.93375, "r_x1": 283.59387, "r_y1": 367.93375, "r_x2": 283.59387, "r_y2": 359.13678, "r_x3": 151.70099, "r_y3": 359.13678, "coord_origin": "TOPLEFT" }, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Left-looking cell rule : The left neighbour of an \"L\" cell must be either another \"L\" cell or a \"C\" cell." }, { "label": "list_item", "id": 4, "page_no": 6, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 138.97299, "t": 371.08481, "r": 480.59229000000005, "b": 391.84673999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9585386514663696, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 379.89175, "r_x1": 146.71991, "r_y1": 379.89175, "r_x2": 146.71991, "r_y2": 371.09479, "r_x3": 138.97299, "r_y3": 371.09479, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 379.89175, "r_x1": 252.11203, "r_y1": 379.89175, "r_x2": 252.11203, "r_y2": 371.08481, "r_x3": 151.70099, "r_y3": 371.08481, "coord_origin": "TOPLEFT" }, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.112, "r_y0": 379.89175, "r_x1": 480.59229000000005, "r_y1": 379.89175, "r_x2": 480.59229000000005, "r_y2": 371.09479, "r_x3": 252.112, "r_y3": 371.09479, "coord_origin": "TOPLEFT" }, "text": ": The upper neighbour of a \"U\" cell must be either", "orig": ": The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 391.84673999999995, "r_x1": 284.8392, "r_y1": 391.84673999999995, "r_x2": 284.8392, "r_y2": 383.04977, "r_x3": 151.70099, "r_y3": 383.04977, "coord_origin": "TOPLEFT" }, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Up-looking cell rule : The upper neighbour of a \"U\" cell must be either another \"U\" cell or a \"C\" cell." }, { "label": "section_header", "id": 14, "page_no": 6, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 138.97299, "t": 394.99780000000004, "r": 226.07360999999997, "b": 403.80475, "coord_origin": "TOPLEFT" }, "confidence": 0.6506174206733704, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 403.80475, "r_x1": 146.71991, "r_y1": 403.80475, "r_x2": 146.71991, "r_y2": 395.0077800000001, "r_x3": 138.97299, "r_y3": 395.0077800000001, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 403.80475, "r_x1": 223.3042, "r_y1": 403.80475, "r_x2": 223.3042, "r_y2": 394.99780000000004, "r_x3": 151.70099, "r_y3": 394.99780000000004, "coord_origin": "TOPLEFT" }, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.30699, "r_y0": 403.80475, "r_x1": 226.07360999999997, "r_y1": 403.80475, "r_x2": 226.07360999999997, "r_y2": 395.0077800000001, "r_x3": 223.30699, "r_y3": 395.0077800000001, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Cross cell rule :" }, { "label": "list_item", "id": 13, "page_no": 6, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 151.70099, "t": 406.96677, "r": 480.59238, "b": 439.67371, "coord_origin": "TOPLEFT" }, "confidence": 0.7247239947319031, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 415.76373, "r_x1": 480.59238, "r_y1": 415.76373, "r_x2": 480.59238, "r_y2": 406.96677, "r_x3": 151.70099, "r_y3": 406.96677, "coord_origin": "TOPLEFT" }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 427.71871999999996, "r_x1": 480.59219, "r_y1": 427.71871999999996, "r_x2": 480.59219, "r_y2": 418.9217499999999, "r_x3": 151.70099, "r_y3": 418.9217499999999, "coord_origin": "TOPLEFT" }, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 439.67371, "r_x1": 214.39663999999996, "r_y1": 439.67371, "r_x2": 214.39663999999996, "r_y2": 430.87674, "r_x3": 151.70099, "r_y3": 430.87674, "coord_origin": "TOPLEFT" }, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\" cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell or an \"L\" cell." }, { "label": "list_item", "id": 8, "page_no": 6, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 138.97299, "t": 442.82574, "r": 474.59018, "b": 451.63269, "coord_origin": "TOPLEFT" }, "confidence": 0.9259927272796631, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 451.63269, "r_x1": 146.71991, "r_y1": 451.63269, "r_x2": 146.71991, "r_y2": 442.83572, "r_x3": 138.97299, "r_y3": 442.83572, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 451.63269, "r_x1": 221.32263, "r_y1": 451.63269, "r_x2": 221.32263, "r_y2": 442.82574, "r_x3": 151.70099, "r_y3": 442.82574, "coord_origin": "TOPLEFT" }, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.32700000000003, "r_y0": 451.63269, "r_x1": 474.59018, "r_y1": 451.63269, "r_x2": 474.59018, "r_y2": 442.83572, "r_x3": 221.32700000000003, "r_y3": 442.83572, "coord_origin": "TOPLEFT" }, "text": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. First row rule : Only \"L\" cells and \"C\" cells are allowed in the first row." }, { "label": "list_item", "id": 5, "page_no": 6, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 138.97299, "t": 454.78375, "r": 480.58746, "b": 475.54568, "coord_origin": "TOPLEFT" }, "confidence": 0.9420599937438965, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 463.5907, "r_x1": 146.71991, "r_y1": 463.5907, "r_x2": 146.71991, "r_y2": 454.7937299999999, "r_x3": 138.97299, "r_y3": 454.7937299999999, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 463.5907, "r_x1": 240.71982, "r_y1": 463.5907, "r_x2": 240.71982, "r_y2": 454.78375, "r_x3": 151.70099, "r_y3": 454.78375, "coord_origin": "TOPLEFT" }, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.71599, "r_y0": 463.5907, "r_x1": 480.58746, "r_y1": 463.5907, "r_x2": 480.58746, "r_y2": 454.7937299999999, "r_x3": 240.71599, "r_y3": 454.7937299999999, "coord_origin": "TOPLEFT" }, "text": ": Only \"U\" cells and \"C\" cells are allowed in the first", "orig": ": Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 475.54568, "r_x1": 186.0072, "r_y1": 475.54568, "r_x2": 186.0072, "r_y2": 466.74872, "r_x3": 151.70099, "r_y3": 466.74872, "coord_origin": "TOPLEFT" }, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. First column rule : Only \"U\" cells and \"C\" cells are allowed in the first column." }, { "label": "list_item", "id": 1, "page_no": 6, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 138.97299, "t": 478.69675, "r": 480.59457, "b": 499.45969, "coord_origin": "TOPLEFT" }, "confidence": 0.9617829918861389, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97299, "r_y0": 487.50369, "r_x1": 146.71991, "r_y1": 487.50369, "r_x2": 146.71991, "r_y2": 478.70673, "r_x3": 138.97299, "r_y3": 478.70673, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 487.50369, "r_x1": 235.15768, "r_y1": 487.50369, "r_x2": 235.15768, "r_y2": 478.69675, "r_x3": 151.70099, "r_y3": 478.69675, "coord_origin": "TOPLEFT" }, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.15697999999998, "r_y0": 487.50369, "r_x1": 480.59457, "r_y1": 487.50369, "r_x2": 480.59457, "r_y2": 478.70673, "r_x3": 235.15697999999998, "r_y3": 478.70673, "coord_origin": "TOPLEFT" }, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.70099, "r_y0": 499.45969, "r_x1": 448.04147, "r_y1": 499.45969, "r_x2": 448.04147, "r_y2": 490.66272, "r_x3": 151.70099, "r_y3": 490.66272, "coord_origin": "TOPLEFT" }, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Rectangular rule : The table representation is always rectangular - all rows must have an equal number of tokens, terminated with \"NL\" token." }, { "label": "text", "id": 0, "page_no": 6, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76498, "t": 512.59271, "r": 480.59583, "b": 640.9416699999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9785562753677368, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 521.38968, "r_x1": 480.59583, "r_y1": 521.38968, "r_x2": 480.59583, "r_y2": 512.59271, "r_x3": 149.70898, "r_y3": 512.59271, "coord_origin": "TOPLEFT" }, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 533.34467, "r_x1": 480.59079, "r_y1": 533.34467, "r_x2": 480.59079, "r_y2": 524.5477000000001, "r_x3": 134.76498, "r_y3": 524.5477000000001, "coord_origin": "TOPLEFT" }, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 545.29967, "r_x1": 480.59482, "r_y1": 545.29967, "r_x2": 480.59482, "r_y2": 536.5027, "r_x3": 134.76498, "r_y3": 536.5027, "coord_origin": "TOPLEFT" }, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 557.25566, "r_x1": 480.58865000000003, "r_y1": 557.25566, "r_x2": 480.58865000000003, "r_y2": 548.4586899999999, "r_x3": 134.76498, "r_y3": 548.4586899999999, "coord_origin": "TOPLEFT" }, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 569.21066, "r_x1": 480.59365999999994, "r_y1": 569.21066, "r_x2": 480.59365999999994, "r_y2": 560.4137000000001, "r_x3": 134.76498, "r_y3": 560.4137000000001, "coord_origin": "TOPLEFT" }, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 581.16566, "r_x1": 480.58673, "r_y1": 581.16566, "r_x2": 480.58673, "r_y2": 572.3687, "r_x3": 134.76498, "r_y3": 572.3687, "coord_origin": "TOPLEFT" }, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 593.12067, "r_x1": 480.59171, "r_y1": 593.12067, "r_x2": 480.59171, "r_y2": 584.3237, "r_x3": 134.76498, "r_y3": 584.3237, "coord_origin": "TOPLEFT" }, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 605.07567, "r_x1": 480.59180000000003, "r_y1": 605.07567, "r_x2": 480.59180000000003, "r_y2": 596.2787, "r_x3": 134.76498, "r_y3": 596.2787, "coord_origin": "TOPLEFT" }, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 617.03166, "r_x1": 480.5936899999999, "r_y1": 617.03166, "r_x2": 480.5936899999999, "r_y2": 608.2347, "r_x3": 134.76498, "r_y3": 608.2347, "coord_origin": "TOPLEFT" }, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 628.98666, "r_x1": 480.59072999999995, "r_y1": 628.98666, "r_x2": 480.59072999999995, "r_y2": 620.1897, "r_x3": 134.76498, "r_y3": 620.1897, "coord_origin": "TOPLEFT" }, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 640.9416699999999, "r_x1": 311.19769, "r_y1": 640.9416699999999, "r_x2": 311.19769, "r_y2": 632.1447000000001, "r_x3": 134.76498, "r_y3": 632.1447000000001, "coord_origin": "TOPLEFT" }, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The application of these rules gives OTSL a set of unique properties. First of all, the OTSL enforces a strictly rectangular structure representation, where every new-line token starts a new row. As a consequence, all rows and all columns have exactly the same number of tokens, irrespective of cell spans. Secondly, the OTSL representation is unambiguous: Every table structure is represented in one way. In this representation every table cell corresponds to a \"C\"-cell token, which in case of spans is always located in the top-left corner of the table cell definition. Third, OTSL syntax rules are only backward-looking. As a consequence, every predicted token can be validated straight during sequence generation by looking at the previously predicted sequence. As such, OTSL can guarantee that every predicted sequence is syntactically valid." }, { "label": "text", "id": 2, "page_no": 6, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76498, "t": 644.1026899999999, "r": 480.59265, "b": 664.8546699999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9590610861778259, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.70898, "r_y0": 652.89966, "r_x1": 480.59186, "r_y1": 652.89966, "r_x2": 480.59186, "r_y2": 644.1026899999999, "r_x3": 149.70898, "r_y3": 644.1026899999999, "coord_origin": "TOPLEFT" }, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 664.8546699999999, "r_x1": 480.59265, "r_y1": 664.8546699999999, "r_x2": 480.59265, "r_y2": 656.05769, "r_x3": 134.76498, "r_y3": 656.05769, "coord_origin": "TOPLEFT" }, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "These characteristics can be easily learned by sequence generator networks, as we demonstrate further below. We find strong indications that this pattern" } ], "headers": [ { "label": "page_header", "id": 7, "page_no": 6, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.932651162147522, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 11, "page_no": 6, "cluster": { "id": 11, "label": "page_header", "bbox": { "l": 475.98431, "t": 93.77099999999996, "r": 480.59125000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8749732375144958, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7" } ] } }, { "page_no": 7, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.58884000000006, "r_y1": 127.73077, "r_x2": 480.58884000000006, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 163.56389, "r_y1": 139.68579, "r_x2": 163.56389, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 170.36377000000005, "r_x1": 149.40205, "r_y1": 170.36377000000005, "r_x2": 149.40205, "r_y2": 161.55682000000002, "r_x3": 134.765, "r_y3": 161.55682000000002, "coord_origin": "TOPLEFT" }, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 170.36377000000005, "r_x1": 319.34708, "r_y1": 170.36377000000005, "r_x2": 319.34708, "r_y2": 161.55682000000002, "r_x3": 160.85904, "r_y3": 161.55682000000002, "coord_origin": "TOPLEFT" }, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 191.0788, "r_x1": 480.59572999999995, "r_y1": 191.0788, "r_x2": 480.59572999999995, "r_y2": 182.28179999999998, "r_x3": 134.765, "r_y3": 182.28179999999998, "coord_origin": "TOPLEFT" }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 203.03479000000004, "r_x1": 480.59473, "r_y1": 203.03479000000004, "r_x2": 480.59473, "r_y2": 194.23779000000002, "r_x3": 134.765, "r_y3": 194.23779000000002, "coord_origin": "TOPLEFT" }, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 214.98981000000003, "r_x1": 480.58678999999995, "r_y1": 214.98981000000003, "r_x2": 480.58678999999995, "r_y2": 206.19281, "r_x3": 134.765, "r_y3": 206.19281, "coord_origin": "TOPLEFT" }, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 226.94482000000005, "r_x1": 480.59177000000005, "r_y1": 226.94482000000005, "r_x2": 480.59177000000005, "r_y2": 218.14783, "r_x3": 134.765, "r_y3": 218.14783, "coord_origin": "TOPLEFT" }, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 238.89984000000004, "r_x1": 480.58768, "r_y1": 238.89984000000004, "r_x2": 480.58768, "r_y2": 230.10284000000001, "r_x3": 134.765, "r_y3": 230.10284000000001, "coord_origin": "TOPLEFT" }, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 250.85486000000003, "r_x1": 480.5867, "r_y1": 250.85486000000003, "r_x2": 480.5867, "r_y2": 242.05786, "r_x3": 134.765, "r_y3": 242.05786, "coord_origin": "TOPLEFT" }, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 262.80988, "r_x1": 480.5938100000001, "r_y1": 262.80988, "r_x2": 480.5938100000001, "r_y2": 254.01288, "r_x3": 134.765, "r_y3": 254.01288, "coord_origin": "TOPLEFT" }, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 274.76586999999995, "r_x1": 480.59069999999997, "r_y1": 274.76586999999995, "r_x2": 480.59069999999997, "r_y2": 265.96887000000004, "r_x3": 134.765, "r_y3": 265.96887000000004, "coord_origin": "TOPLEFT" }, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 286.72086, "r_x1": 480.5957599999999, "r_y1": 286.72086, "r_x2": 480.5957599999999, "r_y2": 277.92389000000003, "r_x3": 134.765, "r_y3": 277.92389000000003, "coord_origin": "TOPLEFT" }, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 298.67584, "r_x1": 469.40369, "r_y1": 298.67584, "r_x2": 469.40369, "r_y2": 289.8788799999999, "r_x3": 134.765, "r_y3": 289.8788799999999, "coord_origin": "TOPLEFT" }, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 331.73239000000007, "r_x1": 141.4886, "r_y1": 331.73239000000007, "r_x2": 141.4886, "r_y2": 321.164, "r_x3": 134.765, "r_y3": 321.164, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9382, "r_y0": 331.73239000000007, "r_x1": 229.03534, "r_y1": 331.73239000000007, "r_x2": 229.03534, "r_y2": 321.164, "r_x3": 154.9382, "r_y3": 321.164, "coord_origin": "TOPLEFT" }, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 356.04681, "r_x1": 480.59375, "r_y1": 356.04681, "r_x2": 480.59375, "r_y2": 347.24985, "r_x3": 134.765, "r_y3": 347.24985, "coord_origin": "TOPLEFT" }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 368.0018, "r_x1": 480.59476, "r_y1": 368.0018, "r_x2": 480.59476, "r_y2": 359.2048300000001, "r_x3": 134.765, "r_y3": 359.2048300000001, "coord_origin": "TOPLEFT" }, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 379.95679, "r_x1": 480.58786000000003, "r_y1": 379.95679, "r_x2": 480.58786000000003, "r_y2": 371.15982, "r_x3": 134.765, "r_y3": 371.15982, "coord_origin": "TOPLEFT" }, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 391.91177, "r_x1": 480.58777, "r_y1": 391.91177, "r_x2": 480.58777, "r_y2": 383.11481000000003, "r_x3": 134.765, "r_y3": 383.11481000000003, "coord_origin": "TOPLEFT" }, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 403.86676, "r_x1": 148.59807, "r_y1": 403.86676, "r_x2": 148.59807, "r_y2": 395.06978999999995, "r_x3": 134.765, "r_y3": 395.06978999999995, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.627, "r_y0": 403.86676, "r_x1": 191.84703, "r_y1": 403.86676, "r_x2": 191.84703, "r_y2": 395.06978999999995, "r_x3": 151.627, "r_y3": 395.06978999999995, "coord_origin": "TOPLEFT" }, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.90201, "r_y0": 403.86676, "r_x1": 480.59528, "r_y1": 403.86676, "r_x2": 480.59528, "r_y2": 395.06978999999995, "r_x3": 195.90201, "r_y3": 395.06978999999995, "coord_origin": "TOPLEFT" }, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 415.82175, "r_x1": 480.59283000000005, "r_y1": 415.82175, "r_x2": 480.59283000000005, "r_y2": 407.02478, "r_x3": 134.76501, "r_y3": 407.02478, "coord_origin": "TOPLEFT" }, "text": "found in the first step and evaluate how OTSL impacts the performance of", "orig": "found in the first step and evaluate how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 427.77774, "r_x1": 480.59476, "r_y1": 427.77774, "r_x2": 480.59476, "r_y2": 418.98077, "r_x3": 134.76501, "r_y3": 418.98077, "coord_origin": "TOPLEFT" }, "text": "TableFormer after training on other publicly available data sets (FinTabNet,", "orig": "TableFormer after training on other publicly available data sets (FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 439.73273, "r_x1": 480.59171, "r_y1": 439.73273, "r_x2": 480.59171, "r_y2": 430.93576, "r_x3": 134.76501, "r_y3": 430.93576, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 451.6877099999999, "r_x1": 479.30258, "r_y1": 451.6877099999999, "r_x2": 479.30258, "r_y2": 442.8907500000001, "r_x3": 134.76501, "r_y3": 442.8907500000001, "coord_origin": "TOPLEFT" }, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 492.57443, "r_x1": 162.64424, "r_y1": 492.57443, "r_x2": 162.64424, "r_y2": 484.64813, "r_x3": 134.76501, "r_y3": 484.64813, "coord_origin": "TOPLEFT" }, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.19601, "r_y0": 492.78067, "r_x1": 480.59082, "r_y1": 492.78067, "r_x2": 480.59082, "r_y2": 484.71091, "r_x3": 165.19601, "r_y3": 484.71091, "coord_origin": "TOPLEFT" }, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 503.73965, "r_x1": 206.70245, "r_y1": 503.73965, "r_x2": 206.70245, "r_y2": 495.66989, "r_x3": 134.76501, "r_y3": 495.66989, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 543.1000799999999, "r_x1": 149.70605, "r_y1": 543.1000799999999, "r_x2": 149.70605, "r_y2": 540.73164, "r_x3": 147.30025, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 543.1000799999999, "r_x1": 155.72055, "r_y1": 543.1000799999999, "r_x2": 155.72055, "r_y2": 540.73164, "r_x3": 150.90895, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.75987, "r_y0": 537.76224, "r_x1": 172.2963, "r_y1": 537.76224, "r_x2": 172.2963, "r_y2": 535.3938, "r_x3": 162.75987, "r_y3": 535.3938, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.63603, "r_y0": 537.73459, "r_x1": 155.91753, "r_y1": 537.73459, "r_x2": 155.91753, "r_y2": 535.3661500000001, "r_x3": 147.63603, "r_y3": 535.3661500000001, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 543.1000799999999, "r_x1": 164.10178, "r_y1": 543.1000799999999, "r_x2": 164.10178, "r_y2": 540.73164, "r_x3": 158.48466, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 547.03909, "r_x1": 162.69737, "r_y1": 547.03909, "r_x2": 162.69737, "r_y2": 544.67065, "r_x3": 158.48466, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 551.28108, "r_x1": 164.10178, "r_y1": 551.28108, "r_x2": 164.10178, "r_y2": 548.91264, "r_x3": 158.48466, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 555.52309, "r_x1": 162.69737, "r_y1": 555.52309, "r_x2": 162.69737, "r_y2": 553.15465, "r_x3": 158.48466, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 543.1000799999999, "r_x1": 172.88876, "r_y1": 543.1000799999999, "r_x2": 172.88876, "r_y2": 540.73164, "r_x3": 168.81696, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 547.03909, "r_x1": 172.88876, "r_y1": 547.03909, "r_x2": 172.88876, "r_y2": 544.67065, "r_x3": 168.81696, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 551.28108, "r_x1": 172.88876, "r_y1": 551.28108, "r_x2": 172.88876, "r_y2": 548.91264, "r_x3": 168.81696, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 555.52309, "r_x1": 172.88876, "r_y1": 555.52309, "r_x2": 172.88876, "r_y2": 553.15465, "r_x3": 168.81696, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 547.03909, "r_x1": 149.70605, "r_y1": 547.03909, "r_x2": 149.70605, "r_y2": 544.67065, "r_x3": 147.30025, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 547.03909, "r_x1": 155.72055, "r_y1": 547.03909, "r_x2": 155.72055, "r_y2": 544.67065, "r_x3": 150.90895, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 551.28108, "r_x1": 149.70605, "r_y1": 551.28108, "r_x2": 149.70605, "r_y2": 548.91264, "r_x3": 147.30025, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 551.28108, "r_x1": 155.72055, "r_y1": 551.28108, "r_x2": 155.72055, "r_y2": 548.91264, "r_x3": 150.90895, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 555.52309, "r_x1": 149.70605, "r_y1": 555.52309, "r_x2": 149.70605, "r_y2": 553.15465, "r_x3": 147.30025, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 555.52309, "r_x1": 155.72055, "r_y1": 555.52309, "r_x2": 155.72055, "r_y2": 553.15465, "r_x3": 150.90895, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05046, "r_y0": 521.27298, "r_x1": 171.24945, "r_y1": 521.27298, "r_x2": 171.24945, "r_y2": 517.0098, "r_x3": 152.05046, "r_y3": 517.0098, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13347, "r_y0": 526.57547, "r_x1": 175.16759, "r_y1": 526.57547, "r_x2": 175.16759, "r_y2": 522.3122900000001, "r_x3": 148.13347, "r_y3": 522.3122900000001, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53331, "r_y0": 528.7774, "r_x1": 220.31973, "r_y1": 528.7774, "r_x2": 220.31973, "r_y2": 524.51422, "r_x3": 193.53331, "r_y3": 524.51422, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47311, "r_y0": 534.0799, "r_x1": 214.37889, "r_y1": 534.0799, "r_x2": 214.37889, "r_y2": 529.8167100000001, "r_x3": 199.47311, "r_y3": 529.8167100000001, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61066, "r_y0": 514.16849, "r_x1": 284.47275, "r_y1": 514.16849, "r_x2": 284.47275, "r_y2": 509.9053, "r_x3": 273.61066, "r_y3": 509.9053, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 517.9560200000001, "r_x1": 287.63242, "r_y1": 517.9560200000001, "r_x2": 287.63242, "r_y2": 513.6928399999999, "r_x3": 270.45187, "r_y3": 513.6928399999999, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.47852, "r_y0": 512.40756, "r_x1": 348.14014, "r_y1": 512.40756, "r_x2": 348.14014, "r_y2": 508.14438, "r_x3": 332.47852, "r_y3": 508.14438, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.68622, "r_y0": 525.38342, "r_x1": 407.25497, "r_y1": 525.38342, "r_x2": 407.25497, "r_y2": 521.12024, "r_x3": 376.68622, "r_y3": 521.12024, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.90869, "r_y0": 529.92844, "r_x1": 410.03506, "r_y1": 529.92844, "r_x2": 410.03506, "r_y2": 525.66525, "r_x3": 373.90869, "r_y3": 525.66525, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.29871, "r_y0": 534.47342, "r_x1": 408.64902, "r_y1": 534.47342, "r_x2": 408.64902, "r_y2": 530.21024, "r_x3": 375.29871, "r_y3": 530.21024, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.06747, "r_y0": 539.01843, "r_x1": 406.88312, "r_y1": 539.01843, "r_x2": 406.88312, "r_y2": 534.75522, "r_x3": 377.06747, "r_y3": 534.75522, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.56683, "r_y0": 567.50497, "r_x1": 433.76544, "r_y1": 567.50497, "r_x2": 433.76544, "r_y2": 563.24176, "r_x3": 383.56683, "r_y3": 563.24176, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.52768, "r_y0": 572.04997, "r_x1": 433.80764999999997, "r_y1": 572.04997, "r_x2": 433.80764999999997, "r_y2": 567.78676, "r_x3": 383.52768, "r_y3": 567.78676, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.47522, "r_y0": 576.59499, "r_x1": 426.85703, "r_y1": 576.59499, "r_x2": 426.85703, "r_y2": 572.33177, "r_x3": 390.47522, "r_y3": 572.33177, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 582.15465, "r_x1": 323.1691, "r_y1": 582.15465, "r_x2": 323.1691, "r_y2": 577.89143, "r_x3": 293.94702, "r_y3": 577.89143, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 586.69969, "r_x1": 324.59396, "r_y1": 586.69969, "r_x2": 324.59396, "r_y2": 582.43648, "r_x3": 293.94702, "r_y3": 582.43648, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 546.08591, "r_x1": 364.14691, "r_y1": 546.08591, "r_x2": 364.14691, "r_y2": 541.82269, "r_x3": 333.07819, "r_y3": 541.82269, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 549.87341, "r_x1": 369.71542, "r_y1": 549.87341, "r_x2": 369.71542, "r_y2": 545.6102, "r_x3": 333.07819, "r_y3": 545.6102, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.65881000000002, "r_y0": 519.50458, "r_x1": 249.58894000000004, "r_y1": 519.50458, "r_x2": 249.58894000000004, "r_y2": 515.24139, "r_x3": 232.65881000000002, "r_y3": 515.24139, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8219, "r_y0": 550.23424, "r_x1": 288.26279, "r_y1": 550.23424, "r_x2": 288.26279, "r_y2": 545.97102, "r_x3": 269.8219, "r_y3": 545.97102, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 554.0217299999999, "r_x1": 287.63242, "r_y1": 554.0217299999999, "r_x2": 287.63242, "r_y2": 549.75851, "r_x3": 270.45187, "r_y3": 549.75851, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 520.17523, "r_x1": 358.11206, "r_y1": 520.17523, "r_x2": 358.11206, "r_y2": 515.91205, "r_x3": 332.17676, "r_y3": 515.91205, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 526.23523, "r_x1": 361.58298, "r_y1": 526.23523, "r_x2": 361.58298, "r_y2": 521.9720500000001, "r_x3": 332.17676, "r_y3": 521.9720500000001, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 532.29523, "r_x1": 364.76474, "r_y1": 532.29523, "r_x2": 364.76474, "r_y2": 528.03204, "r_x3": 332.17676, "r_y3": 528.03204, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 538.35524, "r_x1": 335.96548, "r_y1": 538.35524, "r_x2": 335.96548, "r_y2": 534.09204, "r_x3": 332.17676, "r_y3": 534.09204, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8894, "r_y0": 520.6582599999999, "r_x1": 329.41641, "r_y1": 520.6582599999999, "r_x2": 329.41641, "r_y2": 516.39508, "r_x3": 326.8894, "r_y3": 516.39508, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 526.68796, "r_x1": 329.5679, "r_y1": 526.68796, "r_x2": 329.5679, "r_y2": 522.4247700000001, "r_x3": 327.04089, "r_y3": 522.4247700000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 532.77826, "r_x1": 329.5679, "r_y1": 532.77826, "r_x2": 329.5679, "r_y2": 528.51508, "r_x3": 327.04089, "r_y3": 528.51508, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14102, "r_y0": 531.7060200000001, "r_x1": 426.66803, "r_y1": 531.7060200000001, "r_x2": 426.66803, "r_y2": 527.4428399999999, "r_x3": 424.14102, "r_y3": 527.4428399999999, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0018, "r_y0": 521.71713, "r_x1": 455.52881, "r_y1": 521.71713, "r_x2": 455.52881, "r_y2": 517.4539500000001, "r_x3": 453.0018, "r_y3": 517.4539500000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.85825, "r_y0": 521.32599, "r_x1": 426.38525, "r_y1": 521.32599, "r_x2": 426.38525, "r_y2": 517.06281, "r_x3": 423.85825, "r_y3": 517.06281, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4342, "r_y0": 562.35719, "r_x1": 337.27542, "r_y1": 562.35719, "r_x2": 337.27542, "r_y2": 557.36679, "r_x3": 333.4342, "r_y3": 557.36679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35397, "r_y0": 562.30719, "r_x1": 344.19519, "r_y1": 562.30719, "r_x2": 344.19519, "r_y2": 557.31679, "r_x3": 340.35397, "r_y3": 557.31679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.30978, "r_y0": 568.8557900000001, "r_x1": 344.151, "r_y1": 568.8557900000001, "r_x2": 344.151, "r_y2": 563.8653899999999, "r_x3": 340.30978, "r_y3": 563.8653899999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.79904, "r_y0": 568.85907, "r_x1": 350.64026, "r_y1": 568.85907, "r_x2": 350.64026, "r_y2": 563.8686700000001, "r_x3": 346.79904, "r_y3": 563.8686700000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.59583, "r_y0": 568.81311, "r_x1": 337.43704, "r_y1": 568.81311, "r_x2": 337.43704, "r_y2": 563.82271, "r_x3": 333.59583, "r_y3": 563.82271, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37543, "r_y0": 575.41713, "r_x1": 344.21664, "r_y1": 575.41713, "r_x2": 344.21664, "r_y2": 570.42673, "r_x3": 340.37543, "r_y3": 570.42673, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86469, "r_y0": 575.42041, "r_x1": 350.7059, "r_y1": 575.42041, "r_x2": 350.7059, "r_y2": 570.43001, "r_x3": 346.86469, "r_y3": 570.43001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66144, "r_y0": 575.37445, "r_x1": 337.50266, "r_y1": 575.37445, "r_x2": 337.50266, "r_y2": 570.38405, "r_x3": 333.66144, "r_y3": 570.38405, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37671, "r_y0": 582.0164599999999, "r_x1": 344.21793, "r_y1": 582.0164599999999, "r_x2": 344.21793, "r_y2": 577.02606, "r_x3": 340.37671, "r_y3": 577.02606, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86597, "r_y0": 582.01974, "r_x1": 350.70718, "r_y1": 582.01974, "r_x2": 350.70718, "r_y2": 577.02934, "r_x3": 346.86597, "r_y3": 577.02934, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66272, "r_y0": 581.97379, "r_x1": 337.50394, "r_y1": 581.97379, "r_x2": 337.50394, "r_y2": 576.98338, "r_x3": 333.66272, "r_y3": 576.98338, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.27948, "r_y0": 588.38777, "r_x1": 344.1207, "r_y1": 588.38777, "r_x2": 344.1207, "r_y2": 583.39737, "r_x3": 340.27948, "r_y3": 583.39737, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.76874, "r_y0": 588.39108, "r_x1": 350.60995, "r_y1": 588.39108, "r_x2": 350.60995, "r_y2": 583.40068, "r_x3": 346.76874, "r_y3": 583.40068, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.56549, "r_y0": 588.34514, "r_x1": 337.40671, "r_y1": 588.34514, "r_x2": 337.40671, "r_y2": 583.35474, "r_x3": 333.56549, "r_y3": 583.35474, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03326, "r_y0": 561.87354, "r_x1": 359.83362, "r_y1": 561.87354, "r_x2": 359.83362, "r_y2": 556.8831299999999, "r_x3": 353.03326, "r_y3": 556.8831299999999, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.18604, "r_y0": 568.57085, "r_x1": 359.98639, "r_y1": 568.57085, "r_x2": 359.98639, "r_y2": 563.58044, "r_x3": 353.18604, "r_y3": 563.58044, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19864, "r_y0": 575.15276, "r_x1": 359.99899, "r_y1": 575.15276, "r_x2": 359.99899, "r_y2": 570.1623500000001, "r_x3": 353.19864, "r_y3": 570.1623500000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.1532, "r_y0": 581.75652, "r_x1": 359.95355, "r_y1": 581.75652, "r_x2": 359.95355, "r_y2": 576.76611, "r_x3": 353.1532, "r_y3": 576.76611, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.26935, "r_y0": 588.3966800000001, "r_x1": 360.0697, "r_y1": 588.3966800000001, "r_x2": 360.0697, "r_y2": 583.40628, "r_x3": 353.26935, "r_y3": 583.40628, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.37979, "r_y0": 562.07275, "r_x1": 350.33786, "r_y1": 562.07275, "r_x2": 350.33786, "r_y2": 557.08235, "r_x3": 347.37979, "r_y3": 557.08235, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14026, "r_y0": 568.55399, "r_x1": 333.66727, "r_y1": 568.55399, "r_x2": 333.66727, "r_y2": 564.2907700000001, "r_x3": 331.14026, "r_y3": 564.2907700000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.80972, "r_y0": 558.85634, "r_x1": 343.33673, "r_y1": 558.85634, "r_x2": 343.33673, "r_y2": 554.59312, "r_x3": 340.80972, "r_y3": 554.59312, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.97992, "r_y0": 559.09357, "r_x1": 333.50693, "r_y1": 559.09357, "r_x2": 333.50693, "r_y2": 554.83035, "r_x3": 330.97992, "r_y3": 554.83035, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 628.98975, "r_x1": 480.58792, "r_y1": 628.98975, "r_x2": 480.58792, "r_y2": 620.19278, "r_x3": 149.709, "r_y3": 620.19278, "coord_origin": "TOPLEFT" }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 640.94475, "r_x1": 480.58871, "r_y1": 640.94475, "r_x2": 480.58871, "r_y2": 632.14778, "r_x3": 134.765, "r_y3": 632.14778, "coord_origin": "TOPLEFT" }, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 652.89975, "r_x1": 480.5917400000001, "r_y1": 652.89975, "r_x2": 480.5917400000001, "r_y2": 644.1027799999999, "r_x3": 134.765, "r_y3": 644.1027799999999, "coord_origin": "TOPLEFT" }, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 664.8547599999999, "r_x1": 480.58968999999996, "r_y1": 664.8547599999999, "r_x2": 480.58968999999996, "r_y2": 656.0577900000001, "r_x3": 134.765, "r_y3": 656.0577900000001, "coord_origin": "TOPLEFT" }, "text": "cells. The predicted OTSL structures were converted back to HTML format in", "orig": "cells. The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 9, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 139.37193, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8301323056221008, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "page_header", "bbox": { "l": 167.81335, "t": 93.77099999999996, "r": 231.72227, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8631826043128967, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.58884000000006, "b": 139.68579, "coord_origin": "TOPLEFT" }, "confidence": 0.9464744925498962, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.58884000000006, "r_y1": 127.73077, "r_x2": 480.58884000000006, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 163.56389, "r_y1": 139.68579, "r_x2": 163.56389, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "section_header", "bbox": { "l": 134.765, "t": 161.55682000000002, "r": 319.34708, "b": 170.36377000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9549514651298523, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 170.36377000000005, "r_x1": 149.40205, "r_y1": 170.36377000000005, "r_x2": 149.40205, "r_y2": 161.55682000000002, "r_x3": 134.765, "r_y3": 161.55682000000002, "coord_origin": "TOPLEFT" }, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 170.36377000000005, "r_x1": 319.34708, "r_y1": 170.36377000000005, "r_x2": 319.34708, "r_y2": 161.55682000000002, "r_x3": 160.85904, "r_y3": 161.55682000000002, "coord_origin": "TOPLEFT" }, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.765, "t": 182.28179999999998, "r": 480.5957599999999, "b": 298.67584, "coord_origin": "TOPLEFT" }, "confidence": 0.9879790544509888, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 191.0788, "r_x1": 480.59572999999995, "r_y1": 191.0788, "r_x2": 480.59572999999995, "r_y2": 182.28179999999998, "r_x3": 134.765, "r_y3": 182.28179999999998, "coord_origin": "TOPLEFT" }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 203.03479000000004, "r_x1": 480.59473, "r_y1": 203.03479000000004, "r_x2": 480.59473, "r_y2": 194.23779000000002, "r_x3": 134.765, "r_y3": 194.23779000000002, "coord_origin": "TOPLEFT" }, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 214.98981000000003, "r_x1": 480.58678999999995, "r_y1": 214.98981000000003, "r_x2": 480.58678999999995, "r_y2": 206.19281, "r_x3": 134.765, "r_y3": 206.19281, "coord_origin": "TOPLEFT" }, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 226.94482000000005, "r_x1": 480.59177000000005, "r_y1": 226.94482000000005, "r_x2": 480.59177000000005, "r_y2": 218.14783, "r_x3": 134.765, "r_y3": 218.14783, "coord_origin": "TOPLEFT" }, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 238.89984000000004, "r_x1": 480.58768, "r_y1": 238.89984000000004, "r_x2": 480.58768, "r_y2": 230.10284000000001, "r_x3": 134.765, "r_y3": 230.10284000000001, "coord_origin": "TOPLEFT" }, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 250.85486000000003, "r_x1": 480.5867, "r_y1": 250.85486000000003, "r_x2": 480.5867, "r_y2": 242.05786, "r_x3": 134.765, "r_y3": 242.05786, "coord_origin": "TOPLEFT" }, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 262.80988, "r_x1": 480.5938100000001, "r_y1": 262.80988, "r_x2": 480.5938100000001, "r_y2": 254.01288, "r_x3": 134.765, "r_y3": 254.01288, "coord_origin": "TOPLEFT" }, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 274.76586999999995, "r_x1": 480.59069999999997, "r_y1": 274.76586999999995, "r_x2": 480.59069999999997, "r_y2": 265.96887000000004, "r_x3": 134.765, "r_y3": 265.96887000000004, "coord_origin": "TOPLEFT" }, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 286.72086, "r_x1": 480.5957599999999, "r_y1": 286.72086, "r_x2": 480.5957599999999, "r_y2": 277.92389000000003, "r_x3": 134.765, "r_y3": 277.92389000000003, "coord_origin": "TOPLEFT" }, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 298.67584, "r_x1": 469.40369, "r_y1": 298.67584, "r_x2": 469.40369, "r_y2": 289.8788799999999, "r_x3": 134.765, "r_y3": 289.8788799999999, "coord_origin": "TOPLEFT" }, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "section_header", "bbox": { "l": 134.765, "t": 321.164, "r": 229.03534, "b": 331.73239000000007, "coord_origin": "TOPLEFT" }, "confidence": 0.95152747631073, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 331.73239000000007, "r_x1": 141.4886, "r_y1": 331.73239000000007, "r_x2": 141.4886, "r_y2": 321.164, "r_x3": 134.765, "r_y3": 321.164, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9382, "r_y0": 331.73239000000007, "r_x1": 229.03534, "r_y1": 331.73239000000007, "r_x2": 229.03534, "r_y2": 321.164, "r_x3": 154.9382, "r_y3": 321.164, "coord_origin": "TOPLEFT" }, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 347.24985, "r": 480.59528, "b": 451.6877099999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9877985119819641, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 356.04681, "r_x1": 480.59375, "r_y1": 356.04681, "r_x2": 480.59375, "r_y2": 347.24985, "r_x3": 134.765, "r_y3": 347.24985, "coord_origin": "TOPLEFT" }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 368.0018, "r_x1": 480.59476, "r_y1": 368.0018, "r_x2": 480.59476, "r_y2": 359.2048300000001, "r_x3": 134.765, "r_y3": 359.2048300000001, "coord_origin": "TOPLEFT" }, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 379.95679, "r_x1": 480.58786000000003, "r_y1": 379.95679, "r_x2": 480.58786000000003, "r_y2": 371.15982, "r_x3": 134.765, "r_y3": 371.15982, "coord_origin": "TOPLEFT" }, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 391.91177, "r_x1": 480.58777, "r_y1": 391.91177, "r_x2": 480.58777, "r_y2": 383.11481000000003, "r_x3": 134.765, "r_y3": 383.11481000000003, "coord_origin": "TOPLEFT" }, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 403.86676, "r_x1": 148.59807, "r_y1": 403.86676, "r_x2": 148.59807, "r_y2": 395.06978999999995, "r_x3": 134.765, "r_y3": 395.06978999999995, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.627, "r_y0": 403.86676, "r_x1": 191.84703, "r_y1": 403.86676, "r_x2": 191.84703, "r_y2": 395.06978999999995, "r_x3": 151.627, "r_y3": 395.06978999999995, "coord_origin": "TOPLEFT" }, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.90201, "r_y0": 403.86676, "r_x1": 480.59528, "r_y1": 403.86676, "r_x2": 480.59528, "r_y2": 395.06978999999995, "r_x3": 195.90201, "r_y3": 395.06978999999995, "coord_origin": "TOPLEFT" }, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 415.82175, "r_x1": 480.59283000000005, "r_y1": 415.82175, "r_x2": 480.59283000000005, "r_y2": 407.02478, "r_x3": 134.76501, "r_y3": 407.02478, "coord_origin": "TOPLEFT" }, "text": "found in the first step and evaluate how OTSL impacts the performance of", "orig": "found in the first step and evaluate how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 427.77774, "r_x1": 480.59476, "r_y1": 427.77774, "r_x2": 480.59476, "r_y2": 418.98077, "r_x3": 134.76501, "r_y3": 418.98077, "coord_origin": "TOPLEFT" }, "text": "TableFormer after training on other publicly available data sets (FinTabNet,", "orig": "TableFormer after training on other publicly available data sets (FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 439.73273, "r_x1": 480.59171, "r_y1": 439.73273, "r_x2": 480.59171, "r_y2": 430.93576, "r_x3": 134.76501, "r_y3": 430.93576, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 451.6877099999999, "r_x1": 479.30258, "r_y1": 451.6877099999999, "r_x2": 479.30258, "r_y2": 442.8907500000001, "r_x3": 134.76501, "r_y3": 442.8907500000001, "coord_origin": "TOPLEFT" }, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "caption", "bbox": { "l": 134.76501, "t": 484.64813, "r": 480.59082, "b": 503.73965, "coord_origin": "TOPLEFT" }, "confidence": 0.9297956228256226, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 492.57443, "r_x1": 162.64424, "r_y1": 492.57443, "r_x2": 162.64424, "r_y2": 484.64813, "r_x3": 134.76501, "r_y3": 484.64813, "coord_origin": "TOPLEFT" }, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.19601, "r_y0": 492.78067, "r_x1": 480.59082, "r_y1": 492.78067, "r_x2": 480.59082, "r_y2": 484.71091, "r_x3": 165.19601, "r_y3": 484.71091, "coord_origin": "TOPLEFT" }, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 503.73965, "r_x1": 206.70245, "r_y1": 503.73965, "r_x2": 206.70245, "r_y2": 495.66989, "r_x3": 134.76501, "r_y3": 495.66989, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "picture", "bbox": { "l": 140.70968627929688, "t": 508.0638427734375, "r": 472.73382568359375, "b": 593.6771850585938, "coord_origin": "TOPLEFT" }, "confidence": 0.9303396344184875, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 543.1000799999999, "r_x1": 149.70605, "r_y1": 543.1000799999999, "r_x2": 149.70605, "r_y2": 540.73164, "r_x3": 147.30025, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 543.1000799999999, "r_x1": 155.72055, "r_y1": 543.1000799999999, "r_x2": 155.72055, "r_y2": 540.73164, "r_x3": 150.90895, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.75987, "r_y0": 537.76224, "r_x1": 172.2963, "r_y1": 537.76224, "r_x2": 172.2963, "r_y2": 535.3938, "r_x3": 162.75987, "r_y3": 535.3938, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.63603, "r_y0": 537.73459, "r_x1": 155.91753, "r_y1": 537.73459, "r_x2": 155.91753, "r_y2": 535.3661500000001, "r_x3": 147.63603, "r_y3": 535.3661500000001, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 543.1000799999999, "r_x1": 164.10178, "r_y1": 543.1000799999999, "r_x2": 164.10178, "r_y2": 540.73164, "r_x3": 158.48466, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 547.03909, "r_x1": 162.69737, "r_y1": 547.03909, "r_x2": 162.69737, "r_y2": 544.67065, "r_x3": 158.48466, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 551.28108, "r_x1": 164.10178, "r_y1": 551.28108, "r_x2": 164.10178, "r_y2": 548.91264, "r_x3": 158.48466, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 555.52309, "r_x1": 162.69737, "r_y1": 555.52309, "r_x2": 162.69737, "r_y2": 553.15465, "r_x3": 158.48466, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 543.1000799999999, "r_x1": 172.88876, "r_y1": 543.1000799999999, "r_x2": 172.88876, "r_y2": 540.73164, "r_x3": 168.81696, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 547.03909, "r_x1": 172.88876, "r_y1": 547.03909, "r_x2": 172.88876, "r_y2": 544.67065, "r_x3": 168.81696, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 551.28108, "r_x1": 172.88876, "r_y1": 551.28108, "r_x2": 172.88876, "r_y2": 548.91264, "r_x3": 168.81696, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 555.52309, "r_x1": 172.88876, "r_y1": 555.52309, "r_x2": 172.88876, "r_y2": 553.15465, "r_x3": 168.81696, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 547.03909, "r_x1": 149.70605, "r_y1": 547.03909, "r_x2": 149.70605, "r_y2": 544.67065, "r_x3": 147.30025, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 547.03909, "r_x1": 155.72055, "r_y1": 547.03909, "r_x2": 155.72055, "r_y2": 544.67065, "r_x3": 150.90895, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 551.28108, "r_x1": 149.70605, "r_y1": 551.28108, "r_x2": 149.70605, "r_y2": 548.91264, "r_x3": 147.30025, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 551.28108, "r_x1": 155.72055, "r_y1": 551.28108, "r_x2": 155.72055, "r_y2": 548.91264, "r_x3": 150.90895, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 555.52309, "r_x1": 149.70605, "r_y1": 555.52309, "r_x2": 149.70605, "r_y2": 553.15465, "r_x3": 147.30025, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 555.52309, "r_x1": 155.72055, "r_y1": 555.52309, "r_x2": 155.72055, "r_y2": 553.15465, "r_x3": 150.90895, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05046, "r_y0": 521.27298, "r_x1": 171.24945, "r_y1": 521.27298, "r_x2": 171.24945, "r_y2": 517.0098, "r_x3": 152.05046, "r_y3": 517.0098, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13347, "r_y0": 526.57547, "r_x1": 175.16759, "r_y1": 526.57547, "r_x2": 175.16759, "r_y2": 522.3122900000001, "r_x3": 148.13347, "r_y3": 522.3122900000001, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53331, "r_y0": 528.7774, "r_x1": 220.31973, "r_y1": 528.7774, "r_x2": 220.31973, "r_y2": 524.51422, "r_x3": 193.53331, "r_y3": 524.51422, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47311, "r_y0": 534.0799, "r_x1": 214.37889, "r_y1": 534.0799, "r_x2": 214.37889, "r_y2": 529.8167100000001, "r_x3": 199.47311, "r_y3": 529.8167100000001, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61066, "r_y0": 514.16849, "r_x1": 284.47275, "r_y1": 514.16849, "r_x2": 284.47275, "r_y2": 509.9053, "r_x3": 273.61066, "r_y3": 509.9053, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 517.9560200000001, "r_x1": 287.63242, "r_y1": 517.9560200000001, "r_x2": 287.63242, "r_y2": 513.6928399999999, "r_x3": 270.45187, "r_y3": 513.6928399999999, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.47852, "r_y0": 512.40756, "r_x1": 348.14014, "r_y1": 512.40756, "r_x2": 348.14014, "r_y2": 508.14438, "r_x3": 332.47852, "r_y3": 508.14438, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.68622, "r_y0": 525.38342, "r_x1": 407.25497, "r_y1": 525.38342, "r_x2": 407.25497, "r_y2": 521.12024, "r_x3": 376.68622, "r_y3": 521.12024, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.90869, "r_y0": 529.92844, "r_x1": 410.03506, "r_y1": 529.92844, "r_x2": 410.03506, "r_y2": 525.66525, "r_x3": 373.90869, "r_y3": 525.66525, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.29871, "r_y0": 534.47342, "r_x1": 408.64902, "r_y1": 534.47342, "r_x2": 408.64902, "r_y2": 530.21024, "r_x3": 375.29871, "r_y3": 530.21024, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.06747, "r_y0": 539.01843, "r_x1": 406.88312, "r_y1": 539.01843, "r_x2": 406.88312, "r_y2": 534.75522, "r_x3": 377.06747, "r_y3": 534.75522, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.56683, "r_y0": 567.50497, "r_x1": 433.76544, "r_y1": 567.50497, "r_x2": 433.76544, "r_y2": 563.24176, "r_x3": 383.56683, "r_y3": 563.24176, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.52768, "r_y0": 572.04997, "r_x1": 433.80764999999997, "r_y1": 572.04997, "r_x2": 433.80764999999997, "r_y2": 567.78676, "r_x3": 383.52768, "r_y3": 567.78676, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.47522, "r_y0": 576.59499, "r_x1": 426.85703, "r_y1": 576.59499, "r_x2": 426.85703, "r_y2": 572.33177, "r_x3": 390.47522, "r_y3": 572.33177, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 582.15465, "r_x1": 323.1691, "r_y1": 582.15465, "r_x2": 323.1691, "r_y2": 577.89143, "r_x3": 293.94702, "r_y3": 577.89143, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 586.69969, "r_x1": 324.59396, "r_y1": 586.69969, "r_x2": 324.59396, "r_y2": 582.43648, "r_x3": 293.94702, "r_y3": 582.43648, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 546.08591, "r_x1": 364.14691, "r_y1": 546.08591, "r_x2": 364.14691, "r_y2": 541.82269, "r_x3": 333.07819, "r_y3": 541.82269, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 549.87341, "r_x1": 369.71542, "r_y1": 549.87341, "r_x2": 369.71542, "r_y2": 545.6102, "r_x3": 333.07819, "r_y3": 545.6102, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.65881000000002, "r_y0": 519.50458, "r_x1": 249.58894000000004, "r_y1": 519.50458, "r_x2": 249.58894000000004, "r_y2": 515.24139, "r_x3": 232.65881000000002, "r_y3": 515.24139, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8219, "r_y0": 550.23424, "r_x1": 288.26279, "r_y1": 550.23424, "r_x2": 288.26279, "r_y2": 545.97102, "r_x3": 269.8219, "r_y3": 545.97102, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 554.0217299999999, "r_x1": 287.63242, "r_y1": 554.0217299999999, "r_x2": 287.63242, "r_y2": 549.75851, "r_x3": 270.45187, "r_y3": 549.75851, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 520.17523, "r_x1": 358.11206, "r_y1": 520.17523, "r_x2": 358.11206, "r_y2": 515.91205, "r_x3": 332.17676, "r_y3": 515.91205, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 526.23523, "r_x1": 361.58298, "r_y1": 526.23523, "r_x2": 361.58298, "r_y2": 521.9720500000001, "r_x3": 332.17676, "r_y3": 521.9720500000001, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 532.29523, "r_x1": 364.76474, "r_y1": 532.29523, "r_x2": 364.76474, "r_y2": 528.03204, "r_x3": 332.17676, "r_y3": 528.03204, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 538.35524, "r_x1": 335.96548, "r_y1": 538.35524, "r_x2": 335.96548, "r_y2": 534.09204, "r_x3": 332.17676, "r_y3": 534.09204, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8894, "r_y0": 520.6582599999999, "r_x1": 329.41641, "r_y1": 520.6582599999999, "r_x2": 329.41641, "r_y2": 516.39508, "r_x3": 326.8894, "r_y3": 516.39508, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 526.68796, "r_x1": 329.5679, "r_y1": 526.68796, "r_x2": 329.5679, "r_y2": 522.4247700000001, "r_x3": 327.04089, "r_y3": 522.4247700000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 532.77826, "r_x1": 329.5679, "r_y1": 532.77826, "r_x2": 329.5679, "r_y2": 528.51508, "r_x3": 327.04089, "r_y3": 528.51508, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14102, "r_y0": 531.7060200000001, "r_x1": 426.66803, "r_y1": 531.7060200000001, "r_x2": 426.66803, "r_y2": 527.4428399999999, "r_x3": 424.14102, "r_y3": 527.4428399999999, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0018, "r_y0": 521.71713, "r_x1": 455.52881, "r_y1": 521.71713, "r_x2": 455.52881, "r_y2": 517.4539500000001, "r_x3": 453.0018, "r_y3": 517.4539500000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.85825, "r_y0": 521.32599, "r_x1": 426.38525, "r_y1": 521.32599, "r_x2": 426.38525, "r_y2": 517.06281, "r_x3": 423.85825, "r_y3": 517.06281, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4342, "r_y0": 562.35719, "r_x1": 337.27542, "r_y1": 562.35719, "r_x2": 337.27542, "r_y2": 557.36679, "r_x3": 333.4342, "r_y3": 557.36679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35397, "r_y0": 562.30719, "r_x1": 344.19519, "r_y1": 562.30719, "r_x2": 344.19519, "r_y2": 557.31679, "r_x3": 340.35397, "r_y3": 557.31679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.30978, "r_y0": 568.8557900000001, "r_x1": 344.151, "r_y1": 568.8557900000001, "r_x2": 344.151, "r_y2": 563.8653899999999, "r_x3": 340.30978, "r_y3": 563.8653899999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.79904, "r_y0": 568.85907, "r_x1": 350.64026, "r_y1": 568.85907, "r_x2": 350.64026, "r_y2": 563.8686700000001, "r_x3": 346.79904, "r_y3": 563.8686700000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.59583, "r_y0": 568.81311, "r_x1": 337.43704, "r_y1": 568.81311, "r_x2": 337.43704, "r_y2": 563.82271, "r_x3": 333.59583, "r_y3": 563.82271, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37543, "r_y0": 575.41713, "r_x1": 344.21664, "r_y1": 575.41713, "r_x2": 344.21664, "r_y2": 570.42673, "r_x3": 340.37543, "r_y3": 570.42673, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86469, "r_y0": 575.42041, "r_x1": 350.7059, "r_y1": 575.42041, "r_x2": 350.7059, "r_y2": 570.43001, "r_x3": 346.86469, "r_y3": 570.43001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66144, "r_y0": 575.37445, "r_x1": 337.50266, "r_y1": 575.37445, "r_x2": 337.50266, "r_y2": 570.38405, "r_x3": 333.66144, "r_y3": 570.38405, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37671, "r_y0": 582.0164599999999, "r_x1": 344.21793, "r_y1": 582.0164599999999, "r_x2": 344.21793, "r_y2": 577.02606, "r_x3": 340.37671, "r_y3": 577.02606, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86597, "r_y0": 582.01974, "r_x1": 350.70718, "r_y1": 582.01974, "r_x2": 350.70718, "r_y2": 577.02934, "r_x3": 346.86597, "r_y3": 577.02934, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66272, "r_y0": 581.97379, "r_x1": 337.50394, "r_y1": 581.97379, "r_x2": 337.50394, "r_y2": 576.98338, "r_x3": 333.66272, "r_y3": 576.98338, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.27948, "r_y0": 588.38777, "r_x1": 344.1207, "r_y1": 588.38777, "r_x2": 344.1207, "r_y2": 583.39737, "r_x3": 340.27948, "r_y3": 583.39737, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.76874, "r_y0": 588.39108, "r_x1": 350.60995, "r_y1": 588.39108, "r_x2": 350.60995, "r_y2": 583.40068, "r_x3": 346.76874, "r_y3": 583.40068, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.56549, "r_y0": 588.34514, "r_x1": 337.40671, "r_y1": 588.34514, "r_x2": 337.40671, "r_y2": 583.35474, "r_x3": 333.56549, "r_y3": 583.35474, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03326, "r_y0": 561.87354, "r_x1": 359.83362, "r_y1": 561.87354, "r_x2": 359.83362, "r_y2": 556.8831299999999, "r_x3": 353.03326, "r_y3": 556.8831299999999, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.18604, "r_y0": 568.57085, "r_x1": 359.98639, "r_y1": 568.57085, "r_x2": 359.98639, "r_y2": 563.58044, "r_x3": 353.18604, "r_y3": 563.58044, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19864, "r_y0": 575.15276, "r_x1": 359.99899, "r_y1": 575.15276, "r_x2": 359.99899, "r_y2": 570.1623500000001, "r_x3": 353.19864, "r_y3": 570.1623500000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.1532, "r_y0": 581.75652, "r_x1": 359.95355, "r_y1": 581.75652, "r_x2": 359.95355, "r_y2": 576.76611, "r_x3": 353.1532, "r_y3": 576.76611, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.26935, "r_y0": 588.3966800000001, "r_x1": 360.0697, "r_y1": 588.3966800000001, "r_x2": 360.0697, "r_y2": 583.40628, "r_x3": 353.26935, "r_y3": 583.40628, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.37979, "r_y0": 562.07275, "r_x1": 350.33786, "r_y1": 562.07275, "r_x2": 350.33786, "r_y2": 557.08235, "r_x3": 347.37979, "r_y3": 557.08235, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14026, "r_y0": 568.55399, "r_x1": 333.66727, "r_y1": 568.55399, "r_x2": 333.66727, "r_y2": 564.2907700000001, "r_x3": 331.14026, "r_y3": 564.2907700000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.80972, "r_y0": 558.85634, "r_x1": 343.33673, "r_y1": 558.85634, "r_x2": 343.33673, "r_y2": 554.59312, "r_x3": 340.80972, "r_y3": 554.59312, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.97992, "r_y0": 559.09357, "r_x1": 333.50693, "r_y1": 559.09357, "r_x2": 333.50693, "r_y2": 554.83035, "r_x3": 330.97992, "r_y3": 554.83035, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 13, "label": "text", "bbox": { "l": 147.30025, "t": 540.73164, "r": 149.70605, "b": 543.1000799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 543.1000799999999, "r_x1": 149.70605, "r_y1": 543.1000799999999, "r_x2": 149.70605, "r_y2": 540.73164, "r_x3": 147.30025, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 150.90895, "t": 540.73164, "r": 155.72055, "b": 543.1000799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 543.1000799999999, "r_x1": 155.72055, "r_y1": 543.1000799999999, "r_x2": 155.72055, "r_y2": 540.73164, "r_x3": 150.90895, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 162.75987, "t": 535.3938, "r": 172.2963, "b": 537.76224, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.75987, "r_y0": 537.76224, "r_x1": 172.2963, "r_y1": 537.76224, "r_x2": 172.2963, "r_y2": 535.3938, "r_x3": 162.75987, "r_y3": 535.3938, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 147.63603, "t": 535.3661500000001, "r": 155.91753, "b": 537.73459, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.63603, "r_y0": 537.73459, "r_x1": 155.91753, "r_y1": 537.73459, "r_x2": 155.91753, "r_y2": 535.3661500000001, "r_x3": 147.63603, "r_y3": 535.3661500000001, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 158.48466, "t": 540.73164, "r": 164.10178, "b": 543.1000799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 543.1000799999999, "r_x1": 164.10178, "r_y1": 543.1000799999999, "r_x2": 164.10178, "r_y2": 540.73164, "r_x3": 158.48466, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 158.48466, "t": 544.67065, "r": 162.69737, "b": 547.03909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 547.03909, "r_x1": 162.69737, "r_y1": 547.03909, "r_x2": 162.69737, "r_y2": 544.67065, "r_x3": 158.48466, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 158.48466, "t": 548.91264, "r": 164.10178, "b": 551.28108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 551.28108, "r_x1": 164.10178, "r_y1": 551.28108, "r_x2": 164.10178, "r_y2": 548.91264, "r_x3": 158.48466, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 158.48466, "t": 553.15465, "r": 162.69737, "b": 555.52309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 555.52309, "r_x1": 162.69737, "r_y1": 555.52309, "r_x2": 162.69737, "r_y2": 553.15465, "r_x3": 158.48466, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 168.81696, "t": 540.73164, "r": 172.88876, "b": 543.1000799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 543.1000799999999, "r_x1": 172.88876, "r_y1": 543.1000799999999, "r_x2": 172.88876, "r_y2": 540.73164, "r_x3": 168.81696, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 168.81696, "t": 544.67065, "r": 172.88876, "b": 547.03909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 547.03909, "r_x1": 172.88876, "r_y1": 547.03909, "r_x2": 172.88876, "r_y2": 544.67065, "r_x3": 168.81696, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 168.81696, "t": 548.91264, "r": 172.88876, "b": 551.28108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 551.28108, "r_x1": 172.88876, "r_y1": 551.28108, "r_x2": 172.88876, "r_y2": 548.91264, "r_x3": 168.81696, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 168.81696, "t": 553.15465, "r": 172.88876, "b": 555.52309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 555.52309, "r_x1": 172.88876, "r_y1": 555.52309, "r_x2": 172.88876, "r_y2": 553.15465, "r_x3": 168.81696, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 147.30025, "t": 544.67065, "r": 149.70605, "b": 547.03909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 547.03909, "r_x1": 149.70605, "r_y1": 547.03909, "r_x2": 149.70605, "r_y2": 544.67065, "r_x3": 147.30025, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 150.90895, "t": 544.67065, "r": 155.72055, "b": 547.03909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 547.03909, "r_x1": 155.72055, "r_y1": 547.03909, "r_x2": 155.72055, "r_y2": 544.67065, "r_x3": 150.90895, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 147.30025, "t": 548.91264, "r": 149.70605, "b": 551.28108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 551.28108, "r_x1": 149.70605, "r_y1": 551.28108, "r_x2": 149.70605, "r_y2": 548.91264, "r_x3": 147.30025, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 150.90895, "t": 548.91264, "r": 155.72055, "b": 551.28108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 551.28108, "r_x1": 155.72055, "r_y1": 551.28108, "r_x2": 155.72055, "r_y2": 548.91264, "r_x3": 150.90895, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 147.30025, "t": 553.15465, "r": 149.70605, "b": 555.52309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 555.52309, "r_x1": 149.70605, "r_y1": 555.52309, "r_x2": 149.70605, "r_y2": 553.15465, "r_x3": 147.30025, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 150.90895, "t": 553.15465, "r": 155.72055, "b": 555.52309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 555.52309, "r_x1": 155.72055, "r_y1": 555.52309, "r_x2": 155.72055, "r_y2": 553.15465, "r_x3": 150.90895, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 152.05046, "t": 517.0098, "r": 171.24945, "b": 521.27298, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05046, "r_y0": 521.27298, "r_x1": 171.24945, "r_y1": 521.27298, "r_x2": 171.24945, "r_y2": 517.0098, "r_x3": 152.05046, "r_y3": 517.0098, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 148.13347, "t": 522.3122900000001, "r": 175.16759, "b": 526.57547, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13347, "r_y0": 526.57547, "r_x1": 175.16759, "r_y1": 526.57547, "r_x2": 175.16759, "r_y2": 522.3122900000001, "r_x3": 148.13347, "r_y3": 522.3122900000001, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 193.53331, "t": 524.51422, "r": 220.31973, "b": 528.7774, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53331, "r_y0": 528.7774, "r_x1": 220.31973, "r_y1": 528.7774, "r_x2": 220.31973, "r_y2": 524.51422, "r_x3": 193.53331, "r_y3": 524.51422, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 199.47311, "t": 529.8167100000001, "r": 214.37889, "b": 534.0799, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47311, "r_y0": 534.0799, "r_x1": 214.37889, "r_y1": 534.0799, "r_x2": 214.37889, "r_y2": 529.8167100000001, "r_x3": 199.47311, "r_y3": 529.8167100000001, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 273.61066, "t": 509.9053, "r": 284.47275, "b": 514.16849, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61066, "r_y0": 514.16849, "r_x1": 284.47275, "r_y1": 514.16849, "r_x2": 284.47275, "r_y2": 509.9053, "r_x3": 273.61066, "r_y3": 509.9053, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 270.45187, "t": 513.6928399999999, "r": 287.63242, "b": 517.9560200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 517.9560200000001, "r_x1": 287.63242, "r_y1": 517.9560200000001, "r_x2": 287.63242, "r_y2": 513.6928399999999, "r_x3": 270.45187, "r_y3": 513.6928399999999, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 332.47852, "t": 508.14438, "r": 348.14014, "b": 512.40756, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.47852, "r_y0": 512.40756, "r_x1": 348.14014, "r_y1": 512.40756, "r_x2": 348.14014, "r_y2": 508.14438, "r_x3": 332.47852, "r_y3": 508.14438, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 376.68622, "t": 521.12024, "r": 407.25497, "b": 525.38342, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.68622, "r_y0": 525.38342, "r_x1": 407.25497, "r_y1": 525.38342, "r_x2": 407.25497, "r_y2": 521.12024, "r_x3": 376.68622, "r_y3": 521.12024, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 373.90869, "t": 525.66525, "r": 410.03506, "b": 529.92844, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.90869, "r_y0": 529.92844, "r_x1": 410.03506, "r_y1": 529.92844, "r_x2": 410.03506, "r_y2": 525.66525, "r_x3": 373.90869, "r_y3": 525.66525, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 375.29871, "t": 530.21024, "r": 408.64902, "b": 534.47342, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.29871, "r_y0": 534.47342, "r_x1": 408.64902, "r_y1": 534.47342, "r_x2": 408.64902, "r_y2": 530.21024, "r_x3": 375.29871, "r_y3": 530.21024, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 377.06747, "t": 534.75522, "r": 406.88312, "b": 539.01843, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.06747, "r_y0": 539.01843, "r_x1": 406.88312, "r_y1": 539.01843, "r_x2": 406.88312, "r_y2": 534.75522, "r_x3": 377.06747, "r_y3": 534.75522, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 383.56683, "t": 563.24176, "r": 433.76544, "b": 567.50497, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.56683, "r_y0": 567.50497, "r_x1": 433.76544, "r_y1": 567.50497, "r_x2": 433.76544, "r_y2": 563.24176, "r_x3": 383.56683, "r_y3": 563.24176, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 383.52768, "t": 567.78676, "r": 433.80764999999997, "b": 572.04997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.52768, "r_y0": 572.04997, "r_x1": 433.80764999999997, "r_y1": 572.04997, "r_x2": 433.80764999999997, "r_y2": 567.78676, "r_x3": 383.52768, "r_y3": 567.78676, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 390.47522, "t": 572.33177, "r": 426.85703, "b": 576.59499, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.47522, "r_y0": 576.59499, "r_x1": 426.85703, "r_y1": 576.59499, "r_x2": 426.85703, "r_y2": 572.33177, "r_x3": 390.47522, "r_y3": 572.33177, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 293.94702, "t": 577.89143, "r": 323.1691, "b": 582.15465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 582.15465, "r_x1": 323.1691, "r_y1": 582.15465, "r_x2": 323.1691, "r_y2": 577.89143, "r_x3": 293.94702, "r_y3": 577.89143, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 293.94702, "t": 582.43648, "r": 324.59396, "b": 586.69969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 586.69969, "r_x1": 324.59396, "r_y1": 586.69969, "r_x2": 324.59396, "r_y2": 582.43648, "r_x3": 293.94702, "r_y3": 582.43648, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 333.07819, "t": 541.82269, "r": 364.14691, "b": 546.08591, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 546.08591, "r_x1": 364.14691, "r_y1": 546.08591, "r_x2": 364.14691, "r_y2": 541.82269, "r_x3": 333.07819, "r_y3": 541.82269, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 333.07819, "t": 545.6102, "r": 369.71542, "b": 549.87341, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 549.87341, "r_x1": 369.71542, "r_y1": 549.87341, "r_x2": 369.71542, "r_y2": 545.6102, "r_x3": 333.07819, "r_y3": 545.6102, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 232.65881000000002, "t": 515.24139, "r": 249.58894000000004, "b": 519.50458, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.65881000000002, "r_y0": 519.50458, "r_x1": 249.58894000000004, "r_y1": 519.50458, "r_x2": 249.58894000000004, "r_y2": 515.24139, "r_x3": 232.65881000000002, "r_y3": 515.24139, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 269.8219, "t": 545.97102, "r": 288.26279, "b": 550.23424, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8219, "r_y0": 550.23424, "r_x1": 288.26279, "r_y1": 550.23424, "r_x2": 288.26279, "r_y2": 545.97102, "r_x3": 269.8219, "r_y3": 545.97102, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 270.45187, "t": 549.75851, "r": 287.63242, "b": 554.0217299999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 554.0217299999999, "r_x1": 287.63242, "r_y1": 554.0217299999999, "r_x2": 287.63242, "r_y2": 549.75851, "r_x3": 270.45187, "r_y3": 549.75851, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 332.17676, "t": 515.91205, "r": 358.11206, "b": 520.17523, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 520.17523, "r_x1": 358.11206, "r_y1": 520.17523, "r_x2": 358.11206, "r_y2": 515.91205, "r_x3": 332.17676, "r_y3": 515.91205, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 332.17676, "t": 521.9720500000001, "r": 361.58298, "b": 526.23523, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 526.23523, "r_x1": 361.58298, "r_y1": 526.23523, "r_x2": 361.58298, "r_y2": 521.9720500000001, "r_x3": 332.17676, "r_y3": 521.9720500000001, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 332.17676, "t": 528.03204, "r": 364.76474, "b": 532.29523, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 532.29523, "r_x1": 364.76474, "r_y1": 532.29523, "r_x2": 364.76474, "r_y2": 528.03204, "r_x3": 332.17676, "r_y3": 528.03204, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 332.17676, "t": 534.09204, "r": 335.96548, "b": 538.35524, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 538.35524, "r_x1": 335.96548, "r_y1": 538.35524, "r_x2": 335.96548, "r_y2": 534.09204, "r_x3": 332.17676, "r_y3": 534.09204, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.8894, "t": 516.39508, "r": 329.41641, "b": 520.6582599999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8894, "r_y0": 520.6582599999999, "r_x1": 329.41641, "r_y1": 520.6582599999999, "r_x2": 329.41641, "r_y2": 516.39508, "r_x3": 326.8894, "r_y3": 516.39508, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 327.04089, "t": 522.4247700000001, "r": 329.5679, "b": 526.68796, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 526.68796, "r_x1": 329.5679, "r_y1": 526.68796, "r_x2": 329.5679, "r_y2": 522.4247700000001, "r_x3": 327.04089, "r_y3": 522.4247700000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 327.04089, "t": 528.51508, "r": 329.5679, "b": 532.77826, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 532.77826, "r_x1": 329.5679, "r_y1": 532.77826, "r_x2": 329.5679, "r_y2": 528.51508, "r_x3": 327.04089, "r_y3": 528.51508, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 424.14102, "t": 527.4428399999999, "r": 426.66803, "b": 531.7060200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14102, "r_y0": 531.7060200000001, "r_x1": 426.66803, "r_y1": 531.7060200000001, "r_x2": 426.66803, "r_y2": 527.4428399999999, "r_x3": 424.14102, "r_y3": 527.4428399999999, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 453.0018, "t": 517.4539500000001, "r": 455.52881, "b": 521.71713, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0018, "r_y0": 521.71713, "r_x1": 455.52881, "r_y1": 521.71713, "r_x2": 455.52881, "r_y2": 517.4539500000001, "r_x3": 453.0018, "r_y3": 517.4539500000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 423.85825, "t": 517.06281, "r": 426.38525, "b": 521.32599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.85825, "r_y0": 521.32599, "r_x1": 426.38525, "r_y1": 521.32599, "r_x2": 426.38525, "r_y2": 517.06281, "r_x3": 423.85825, "r_y3": 517.06281, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 333.4342, "t": 557.36679, "r": 337.27542, "b": 562.35719, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4342, "r_y0": 562.35719, "r_x1": 337.27542, "r_y1": 562.35719, "r_x2": 337.27542, "r_y2": 557.36679, "r_x3": 333.4342, "r_y3": 557.36679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 340.35397, "t": 557.31679, "r": 344.19519, "b": 562.30719, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35397, "r_y0": 562.30719, "r_x1": 344.19519, "r_y1": 562.30719, "r_x2": 344.19519, "r_y2": 557.31679, "r_x3": 340.35397, "r_y3": 557.31679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 340.30978, "t": 563.8653899999999, "r": 344.151, "b": 568.8557900000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.30978, "r_y0": 568.8557900000001, "r_x1": 344.151, "r_y1": 568.8557900000001, "r_x2": 344.151, "r_y2": 563.8653899999999, "r_x3": 340.30978, "r_y3": 563.8653899999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 346.79904, "t": 563.8686700000001, "r": 350.64026, "b": 568.85907, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.79904, "r_y0": 568.85907, "r_x1": 350.64026, "r_y1": 568.85907, "r_x2": 350.64026, "r_y2": 563.8686700000001, "r_x3": 346.79904, "r_y3": 563.8686700000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 333.59583, "t": 563.82271, "r": 337.43704, "b": 568.81311, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.59583, "r_y0": 568.81311, "r_x1": 337.43704, "r_y1": 568.81311, "r_x2": 337.43704, "r_y2": 563.82271, "r_x3": 333.59583, "r_y3": 563.82271, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 340.37543, "t": 570.42673, "r": 344.21664, "b": 575.41713, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37543, "r_y0": 575.41713, "r_x1": 344.21664, "r_y1": 575.41713, "r_x2": 344.21664, "r_y2": 570.42673, "r_x3": 340.37543, "r_y3": 570.42673, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 346.86469, "t": 570.43001, "r": 350.7059, "b": 575.42041, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86469, "r_y0": 575.42041, "r_x1": 350.7059, "r_y1": 575.42041, "r_x2": 350.7059, "r_y2": 570.43001, "r_x3": 346.86469, "r_y3": 570.43001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 333.66144, "t": 570.38405, "r": 337.50266, "b": 575.37445, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66144, "r_y0": 575.37445, "r_x1": 337.50266, "r_y1": 575.37445, "r_x2": 337.50266, "r_y2": 570.38405, "r_x3": 333.66144, "r_y3": 570.38405, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 340.37671, "t": 577.02606, "r": 344.21793, "b": 582.0164599999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37671, "r_y0": 582.0164599999999, "r_x1": 344.21793, "r_y1": 582.0164599999999, "r_x2": 344.21793, "r_y2": 577.02606, "r_x3": 340.37671, "r_y3": 577.02606, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 346.86597, "t": 577.02934, "r": 350.70718, "b": 582.01974, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86597, "r_y0": 582.01974, "r_x1": 350.70718, "r_y1": 582.01974, "r_x2": 350.70718, "r_y2": 577.02934, "r_x3": 346.86597, "r_y3": 577.02934, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 333.66272, "t": 576.98338, "r": 337.50394, "b": 581.97379, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66272, "r_y0": 581.97379, "r_x1": 337.50394, "r_y1": 581.97379, "r_x2": 337.50394, "r_y2": 576.98338, "r_x3": 333.66272, "r_y3": 576.98338, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 340.27948, "t": 583.39737, "r": 344.1207, "b": 588.38777, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.27948, "r_y0": 588.38777, "r_x1": 344.1207, "r_y1": 588.38777, "r_x2": 344.1207, "r_y2": 583.39737, "r_x3": 340.27948, "r_y3": 583.39737, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 346.76874, "t": 583.40068, "r": 350.60995, "b": 588.39108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.76874, "r_y0": 588.39108, "r_x1": 350.60995, "r_y1": 588.39108, "r_x2": 350.60995, "r_y2": 583.40068, "r_x3": 346.76874, "r_y3": 583.40068, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 333.56549, "t": 583.35474, "r": 337.40671, "b": 588.34514, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.56549, "r_y0": 588.34514, "r_x1": 337.40671, "r_y1": 588.34514, "r_x2": 337.40671, "r_y2": 583.35474, "r_x3": 333.56549, "r_y3": 583.35474, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 353.03326, "t": 556.8831299999999, "r": 359.83362, "b": 561.87354, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03326, "r_y0": 561.87354, "r_x1": 359.83362, "r_y1": 561.87354, "r_x2": 359.83362, "r_y2": 556.8831299999999, "r_x3": 353.03326, "r_y3": 556.8831299999999, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 353.18604, "t": 563.58044, "r": 359.98639, "b": 568.57085, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.18604, "r_y0": 568.57085, "r_x1": 359.98639, "r_y1": 568.57085, "r_x2": 359.98639, "r_y2": 563.58044, "r_x3": 353.18604, "r_y3": 563.58044, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 353.19864, "t": 570.1623500000001, "r": 359.99899, "b": 575.15276, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19864, "r_y0": 575.15276, "r_x1": 359.99899, "r_y1": 575.15276, "r_x2": 359.99899, "r_y2": 570.1623500000001, "r_x3": 353.19864, "r_y3": 570.1623500000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 353.1532, "t": 576.76611, "r": 359.95355, "b": 581.75652, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.1532, "r_y0": 581.75652, "r_x1": 359.95355, "r_y1": 581.75652, "r_x2": 359.95355, "r_y2": 576.76611, "r_x3": 353.1532, "r_y3": 576.76611, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 353.26935, "t": 583.40628, "r": 360.0697, "b": 588.3966800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.26935, "r_y0": 588.3966800000001, "r_x1": 360.0697, "r_y1": 588.3966800000001, "r_x2": 360.0697, "r_y2": 583.40628, "r_x3": 353.26935, "r_y3": 583.40628, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 347.37979, "t": 557.08235, "r": 350.33786, "b": 562.07275, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.37979, "r_y0": 562.07275, "r_x1": 350.33786, "r_y1": 562.07275, "r_x2": 350.33786, "r_y2": 557.08235, "r_x3": 347.37979, "r_y3": 557.08235, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 331.14026, "t": 564.2907700000001, "r": 333.66727, "b": 568.55399, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14026, "r_y0": 568.55399, "r_x1": 333.66727, "r_y1": 568.55399, "r_x2": 333.66727, "r_y2": 564.2907700000001, "r_x3": 331.14026, "r_y3": 564.2907700000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 340.80972, "t": 554.59312, "r": 343.33673, "b": 558.85634, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.80972, "r_y0": 558.85634, "r_x1": 343.33673, "r_y1": 558.85634, "r_x2": 343.33673, "r_y2": 554.59312, "r_x3": 340.80972, "r_y3": 554.59312, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 330.97992, "t": 554.83035, "r": 333.50693, "b": 559.09357, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.97992, "r_y0": 559.09357, "r_x1": 333.50693, "r_y1": 559.09357, "r_x2": 333.50693, "r_y2": 554.83035, "r_x3": 330.97992, "r_y3": 554.83035, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 4, "label": "text", "bbox": { "l": 134.765, "t": 620.19278, "r": 480.5917400000001, "b": 664.8547599999999, "coord_origin": "TOPLEFT" }, "confidence": 0.951270341873169, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 628.98975, "r_x1": 480.58792, "r_y1": 628.98975, "r_x2": 480.58792, "r_y2": 620.19278, "r_x3": 149.709, "r_y3": 620.19278, "coord_origin": "TOPLEFT" }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 640.94475, "r_x1": 480.58871, "r_y1": 640.94475, "r_x2": 480.58871, "r_y2": 632.14778, "r_x3": 134.765, "r_y3": 632.14778, "coord_origin": "TOPLEFT" }, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 652.89975, "r_x1": 480.5917400000001, "r_y1": 652.89975, "r_x2": 480.5917400000001, "r_y2": 644.1027799999999, "r_x3": 134.765, "r_y3": 644.1027799999999, "coord_origin": "TOPLEFT" }, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 664.8547599999999, "r_x1": 480.58968999999996, "r_y1": 664.8547599999999, "r_x2": 480.58968999999996, "r_y2": 656.0577900000001, "r_x3": 134.765, "r_y3": 656.0577900000001, "coord_origin": "TOPLEFT" }, "text": "cells. The predicted OTSL structures were converted back to HTML format in", "orig": "cells. The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 9, "page_no": 7, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 139.37193, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8301323056221008, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8" }, { "label": "page_header", "id": 8, "page_no": 7, "cluster": { "id": 8, "label": "page_header", "bbox": { "l": 167.81335, "t": 93.77099999999996, "r": 231.72227, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8631826043128967, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "text", "id": 5, "page_no": 7, "cluster": { "id": 5, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.58884000000006, "b": 139.68579, "coord_origin": "TOPLEFT" }, "confidence": 0.9464744925498962, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.58884000000006, "r_y1": 127.73077, "r_x2": 480.58884000000006, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 163.56389, "r_y1": 139.68579, "r_x2": 163.56389, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "reduces significantly the column drift seen in the HTML based models (see Figure 5)." }, { "label": "section_header", "id": 2, "page_no": 7, "cluster": { "id": 2, "label": "section_header", "bbox": { "l": 134.765, "t": 161.55682000000002, "r": 319.34708, "b": 170.36377000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9549514651298523, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 170.36377000000005, "r_x1": 149.40205, "r_y1": 170.36377000000005, "r_x2": 149.40205, "r_y2": 161.55682000000002, "r_x3": 134.765, "r_y3": 161.55682000000002, "coord_origin": "TOPLEFT" }, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 170.36377000000005, "r_x1": 319.34708, "r_y1": 170.36377000000005, "r_x2": 319.34708, "r_y2": 161.55682000000002, "r_x3": 160.85904, "r_y3": 161.55682000000002, "coord_origin": "TOPLEFT" }, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.3 Error-detection and -mitigation" }, { "label": "text", "id": 0, "page_no": 7, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.765, "t": 182.28179999999998, "r": 480.5957599999999, "b": 298.67584, "coord_origin": "TOPLEFT" }, "confidence": 0.9879790544509888, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 191.0788, "r_x1": 480.59572999999995, "r_y1": 191.0788, "r_x2": 480.59572999999995, "r_y2": 182.28179999999998, "r_x3": 134.765, "r_y3": 182.28179999999998, "coord_origin": "TOPLEFT" }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 203.03479000000004, "r_x1": 480.59473, "r_y1": 203.03479000000004, "r_x2": 480.59473, "r_y2": 194.23779000000002, "r_x3": 134.765, "r_y3": 194.23779000000002, "coord_origin": "TOPLEFT" }, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 214.98981000000003, "r_x1": 480.58678999999995, "r_y1": 214.98981000000003, "r_x2": 480.58678999999995, "r_y2": 206.19281, "r_x3": 134.765, "r_y3": 206.19281, "coord_origin": "TOPLEFT" }, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 226.94482000000005, "r_x1": 480.59177000000005, "r_y1": 226.94482000000005, "r_x2": 480.59177000000005, "r_y2": 218.14783, "r_x3": 134.765, "r_y3": 218.14783, "coord_origin": "TOPLEFT" }, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 238.89984000000004, "r_x1": 480.58768, "r_y1": 238.89984000000004, "r_x2": 480.58768, "r_y2": 230.10284000000001, "r_x3": 134.765, "r_y3": 230.10284000000001, "coord_origin": "TOPLEFT" }, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 250.85486000000003, "r_x1": 480.5867, "r_y1": 250.85486000000003, "r_x2": 480.5867, "r_y2": 242.05786, "r_x3": 134.765, "r_y3": 242.05786, "coord_origin": "TOPLEFT" }, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 262.80988, "r_x1": 480.5938100000001, "r_y1": 262.80988, "r_x2": 480.5938100000001, "r_y2": 254.01288, "r_x3": 134.765, "r_y3": 254.01288, "coord_origin": "TOPLEFT" }, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 274.76586999999995, "r_x1": 480.59069999999997, "r_y1": 274.76586999999995, "r_x2": 480.59069999999997, "r_y2": 265.96887000000004, "r_x3": 134.765, "r_y3": 265.96887000000004, "coord_origin": "TOPLEFT" }, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 286.72086, "r_x1": 480.5957599999999, "r_y1": 286.72086, "r_x2": 480.5957599999999, "r_y2": 277.92389000000003, "r_x3": 134.765, "r_y3": 277.92389000000003, "coord_origin": "TOPLEFT" }, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 298.67584, "r_x1": 469.40369, "r_y1": 298.67584, "r_x2": 469.40369, "r_y2": 289.8788799999999, "r_x3": 134.765, "r_y3": 289.8788799999999, "coord_origin": "TOPLEFT" }, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished sequence. The detection of an invalid sequence token is a clear indication of a prediction mistake, however a valid sequence by itself does not guarantee prediction correctness. Different heuristics can be used to correct token errors in an invalid sequence and thus increase the chances for accurate predictions. Such heuristics can be applied either after the prediction of each token, or at the end on the entire predicted sequence. For example a simple heuristic which can correct the predicted OTSL sequence on-the-fly is to verify if the token with the highest prediction confidence invalidates the predicted sequence, and replace it by the token with the next highest confidence until OTSL rules are satisfied." }, { "label": "section_header", "id": 3, "page_no": 7, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.765, "t": 321.164, "r": 229.03534, "b": 331.73239000000007, "coord_origin": "TOPLEFT" }, "confidence": 0.95152747631073, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 331.73239000000007, "r_x1": 141.4886, "r_y1": 331.73239000000007, "r_x2": 141.4886, "r_y2": 321.164, "r_x3": 134.765, "r_y3": 321.164, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9382, "r_y0": 331.73239000000007, "r_x1": 229.03534, "r_y1": 331.73239000000007, "r_x2": 229.03534, "r_y2": 321.164, "r_x3": 154.9382, "r_y3": 321.164, "coord_origin": "TOPLEFT" }, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5 Experiments" }, { "label": "text", "id": 1, "page_no": 7, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 347.24985, "r": 480.59528, "b": 451.6877099999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9877985119819641, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 356.04681, "r_x1": 480.59375, "r_y1": 356.04681, "r_x2": 480.59375, "r_y2": 347.24985, "r_x3": 134.765, "r_y3": 347.24985, "coord_origin": "TOPLEFT" }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 368.0018, "r_x1": 480.59476, "r_y1": 368.0018, "r_x2": 480.59476, "r_y2": 359.2048300000001, "r_x3": 134.765, "r_y3": 359.2048300000001, "coord_origin": "TOPLEFT" }, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 379.95679, "r_x1": 480.58786000000003, "r_y1": 379.95679, "r_x2": 480.58786000000003, "r_y2": 371.15982, "r_x3": 134.765, "r_y3": 371.15982, "coord_origin": "TOPLEFT" }, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 391.91177, "r_x1": 480.58777, "r_y1": 391.91177, "r_x2": 480.58777, "r_y2": 383.11481000000003, "r_x3": 134.765, "r_y3": 383.11481000000003, "coord_origin": "TOPLEFT" }, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 403.86676, "r_x1": 148.59807, "r_y1": 403.86676, "r_x2": 148.59807, "r_y2": 395.06978999999995, "r_x3": 134.765, "r_y3": 395.06978999999995, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.627, "r_y0": 403.86676, "r_x1": 191.84703, "r_y1": 403.86676, "r_x2": 191.84703, "r_y2": 395.06978999999995, "r_x3": 151.627, "r_y3": 395.06978999999995, "coord_origin": "TOPLEFT" }, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.90201, "r_y0": 403.86676, "r_x1": 480.59528, "r_y1": 403.86676, "r_x2": 480.59528, "r_y2": 395.06978999999995, "r_x3": 195.90201, "r_y3": 395.06978999999995, "coord_origin": "TOPLEFT" }, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 415.82175, "r_x1": 480.59283000000005, "r_y1": 415.82175, "r_x2": 480.59283000000005, "r_y2": 407.02478, "r_x3": 134.76501, "r_y3": 407.02478, "coord_origin": "TOPLEFT" }, "text": "found in the first step and evaluate how OTSL impacts the performance of", "orig": "found in the first step and evaluate how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 427.77774, "r_x1": 480.59476, "r_y1": 427.77774, "r_x2": 480.59476, "r_y2": 418.98077, "r_x3": 134.76501, "r_y3": 418.98077, "coord_origin": "TOPLEFT" }, "text": "TableFormer after training on other publicly available data sets (FinTabNet,", "orig": "TableFormer after training on other publicly available data sets (FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 439.73273, "r_x1": 480.59171, "r_y1": 439.73273, "r_x2": 480.59171, "r_y2": 430.93576, "r_x3": 134.76501, "r_y3": 430.93576, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 451.6877099999999, "r_x1": 479.30258, "r_y1": 451.6877099999999, "r_x2": 479.30258, "r_y2": 442.8907500000001, "r_x3": 134.76501, "r_y3": 442.8907500000001, "coord_origin": "TOPLEFT" }, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we conducted a series of experiments based on the TableFormer model (Figure 4) with two objectives: Firstly we evaluate the prediction quality and performance of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on the canonical PubTabNet data set. Secondly we pick the best hyper-parameters found in the first step and evaluate how OTSL impacts the performance of TableFormer after training on other publicly available data sets (FinTabNet, PubTables-1M [14]). The ground truth (GT) from all data sets has been converted into OTSL format for this purpose, and will be made publicly available." }, { "label": "caption", "id": 7, "page_no": 7, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 134.76501, "t": 484.64813, "r": 480.59082, "b": 503.73965, "coord_origin": "TOPLEFT" }, "confidence": 0.9297956228256226, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 492.57443, "r_x1": 162.64424, "r_y1": 492.57443, "r_x2": 162.64424, "r_y2": 484.64813, "r_x3": 134.76501, "r_y3": 484.64813, "coord_origin": "TOPLEFT" }, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.19601, "r_y0": 492.78067, "r_x1": 480.59082, "r_y1": 492.78067, "r_x2": 480.59082, "r_y2": 484.71091, "r_x3": 165.19601, "r_y3": 484.71091, "coord_origin": "TOPLEFT" }, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 503.73965, "r_x1": 206.70245, "r_y1": 503.73965, "r_x2": 206.70245, "r_y2": 495.66989, "r_x3": 134.76501, "r_y3": 495.66989, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 4. Architecture sketch of the TableFormer model, which is a representative for the Im2Seq approach." }, { "label": "picture", "id": 6, "page_no": 7, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 140.70968627929688, "t": 508.0638427734375, "r": 472.73382568359375, "b": 593.6771850585938, "coord_origin": "TOPLEFT" }, "confidence": 0.9303396344184875, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 543.1000799999999, "r_x1": 149.70605, "r_y1": 543.1000799999999, "r_x2": 149.70605, "r_y2": 540.73164, "r_x3": 147.30025, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 543.1000799999999, "r_x1": 155.72055, "r_y1": 543.1000799999999, "r_x2": 155.72055, "r_y2": 540.73164, "r_x3": 150.90895, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.75987, "r_y0": 537.76224, "r_x1": 172.2963, "r_y1": 537.76224, "r_x2": 172.2963, "r_y2": 535.3938, "r_x3": 162.75987, "r_y3": 535.3938, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.63603, "r_y0": 537.73459, "r_x1": 155.91753, "r_y1": 537.73459, "r_x2": 155.91753, "r_y2": 535.3661500000001, "r_x3": 147.63603, "r_y3": 535.3661500000001, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 543.1000799999999, "r_x1": 164.10178, "r_y1": 543.1000799999999, "r_x2": 164.10178, "r_y2": 540.73164, "r_x3": 158.48466, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 547.03909, "r_x1": 162.69737, "r_y1": 547.03909, "r_x2": 162.69737, "r_y2": 544.67065, "r_x3": 158.48466, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 551.28108, "r_x1": 164.10178, "r_y1": 551.28108, "r_x2": 164.10178, "r_y2": 548.91264, "r_x3": 158.48466, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 555.52309, "r_x1": 162.69737, "r_y1": 555.52309, "r_x2": 162.69737, "r_y2": 553.15465, "r_x3": 158.48466, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 543.1000799999999, "r_x1": 172.88876, "r_y1": 543.1000799999999, "r_x2": 172.88876, "r_y2": 540.73164, "r_x3": 168.81696, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 547.03909, "r_x1": 172.88876, "r_y1": 547.03909, "r_x2": 172.88876, "r_y2": 544.67065, "r_x3": 168.81696, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 551.28108, "r_x1": 172.88876, "r_y1": 551.28108, "r_x2": 172.88876, "r_y2": 548.91264, "r_x3": 168.81696, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 555.52309, "r_x1": 172.88876, "r_y1": 555.52309, "r_x2": 172.88876, "r_y2": 553.15465, "r_x3": 168.81696, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 547.03909, "r_x1": 149.70605, "r_y1": 547.03909, "r_x2": 149.70605, "r_y2": 544.67065, "r_x3": 147.30025, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 547.03909, "r_x1": 155.72055, "r_y1": 547.03909, "r_x2": 155.72055, "r_y2": 544.67065, "r_x3": 150.90895, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 551.28108, "r_x1": 149.70605, "r_y1": 551.28108, "r_x2": 149.70605, "r_y2": 548.91264, "r_x3": 147.30025, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 551.28108, "r_x1": 155.72055, "r_y1": 551.28108, "r_x2": 155.72055, "r_y2": 548.91264, "r_x3": 150.90895, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 555.52309, "r_x1": 149.70605, "r_y1": 555.52309, "r_x2": 149.70605, "r_y2": 553.15465, "r_x3": 147.30025, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 555.52309, "r_x1": 155.72055, "r_y1": 555.52309, "r_x2": 155.72055, "r_y2": 553.15465, "r_x3": 150.90895, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05046, "r_y0": 521.27298, "r_x1": 171.24945, "r_y1": 521.27298, "r_x2": 171.24945, "r_y2": 517.0098, "r_x3": 152.05046, "r_y3": 517.0098, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13347, "r_y0": 526.57547, "r_x1": 175.16759, "r_y1": 526.57547, "r_x2": 175.16759, "r_y2": 522.3122900000001, "r_x3": 148.13347, "r_y3": 522.3122900000001, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53331, "r_y0": 528.7774, "r_x1": 220.31973, "r_y1": 528.7774, "r_x2": 220.31973, "r_y2": 524.51422, "r_x3": 193.53331, "r_y3": 524.51422, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47311, "r_y0": 534.0799, "r_x1": 214.37889, "r_y1": 534.0799, "r_x2": 214.37889, "r_y2": 529.8167100000001, "r_x3": 199.47311, "r_y3": 529.8167100000001, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61066, "r_y0": 514.16849, "r_x1": 284.47275, "r_y1": 514.16849, "r_x2": 284.47275, "r_y2": 509.9053, "r_x3": 273.61066, "r_y3": 509.9053, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 517.9560200000001, "r_x1": 287.63242, "r_y1": 517.9560200000001, "r_x2": 287.63242, "r_y2": 513.6928399999999, "r_x3": 270.45187, "r_y3": 513.6928399999999, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.47852, "r_y0": 512.40756, "r_x1": 348.14014, "r_y1": 512.40756, "r_x2": 348.14014, "r_y2": 508.14438, "r_x3": 332.47852, "r_y3": 508.14438, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.68622, "r_y0": 525.38342, "r_x1": 407.25497, "r_y1": 525.38342, "r_x2": 407.25497, "r_y2": 521.12024, "r_x3": 376.68622, "r_y3": 521.12024, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.90869, "r_y0": 529.92844, "r_x1": 410.03506, "r_y1": 529.92844, "r_x2": 410.03506, "r_y2": 525.66525, "r_x3": 373.90869, "r_y3": 525.66525, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.29871, "r_y0": 534.47342, "r_x1": 408.64902, "r_y1": 534.47342, "r_x2": 408.64902, "r_y2": 530.21024, "r_x3": 375.29871, "r_y3": 530.21024, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.06747, "r_y0": 539.01843, "r_x1": 406.88312, "r_y1": 539.01843, "r_x2": 406.88312, "r_y2": 534.75522, "r_x3": 377.06747, "r_y3": 534.75522, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.56683, "r_y0": 567.50497, "r_x1": 433.76544, "r_y1": 567.50497, "r_x2": 433.76544, "r_y2": 563.24176, "r_x3": 383.56683, "r_y3": 563.24176, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.52768, "r_y0": 572.04997, "r_x1": 433.80764999999997, "r_y1": 572.04997, "r_x2": 433.80764999999997, "r_y2": 567.78676, "r_x3": 383.52768, "r_y3": 567.78676, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.47522, "r_y0": 576.59499, "r_x1": 426.85703, "r_y1": 576.59499, "r_x2": 426.85703, "r_y2": 572.33177, "r_x3": 390.47522, "r_y3": 572.33177, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 582.15465, "r_x1": 323.1691, "r_y1": 582.15465, "r_x2": 323.1691, "r_y2": 577.89143, "r_x3": 293.94702, "r_y3": 577.89143, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 586.69969, "r_x1": 324.59396, "r_y1": 586.69969, "r_x2": 324.59396, "r_y2": 582.43648, "r_x3": 293.94702, "r_y3": 582.43648, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 546.08591, "r_x1": 364.14691, "r_y1": 546.08591, "r_x2": 364.14691, "r_y2": 541.82269, "r_x3": 333.07819, "r_y3": 541.82269, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 549.87341, "r_x1": 369.71542, "r_y1": 549.87341, "r_x2": 369.71542, "r_y2": 545.6102, "r_x3": 333.07819, "r_y3": 545.6102, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.65881000000002, "r_y0": 519.50458, "r_x1": 249.58894000000004, "r_y1": 519.50458, "r_x2": 249.58894000000004, "r_y2": 515.24139, "r_x3": 232.65881000000002, "r_y3": 515.24139, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8219, "r_y0": 550.23424, "r_x1": 288.26279, "r_y1": 550.23424, "r_x2": 288.26279, "r_y2": 545.97102, "r_x3": 269.8219, "r_y3": 545.97102, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 554.0217299999999, "r_x1": 287.63242, "r_y1": 554.0217299999999, "r_x2": 287.63242, "r_y2": 549.75851, "r_x3": 270.45187, "r_y3": 549.75851, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 520.17523, "r_x1": 358.11206, "r_y1": 520.17523, "r_x2": 358.11206, "r_y2": 515.91205, "r_x3": 332.17676, "r_y3": 515.91205, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 526.23523, "r_x1": 361.58298, "r_y1": 526.23523, "r_x2": 361.58298, "r_y2": 521.9720500000001, "r_x3": 332.17676, "r_y3": 521.9720500000001, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 532.29523, "r_x1": 364.76474, "r_y1": 532.29523, "r_x2": 364.76474, "r_y2": 528.03204, "r_x3": 332.17676, "r_y3": 528.03204, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 538.35524, "r_x1": 335.96548, "r_y1": 538.35524, "r_x2": 335.96548, "r_y2": 534.09204, "r_x3": 332.17676, "r_y3": 534.09204, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8894, "r_y0": 520.6582599999999, "r_x1": 329.41641, "r_y1": 520.6582599999999, "r_x2": 329.41641, "r_y2": 516.39508, "r_x3": 326.8894, "r_y3": 516.39508, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 526.68796, "r_x1": 329.5679, "r_y1": 526.68796, "r_x2": 329.5679, "r_y2": 522.4247700000001, "r_x3": 327.04089, "r_y3": 522.4247700000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 532.77826, "r_x1": 329.5679, "r_y1": 532.77826, "r_x2": 329.5679, "r_y2": 528.51508, "r_x3": 327.04089, "r_y3": 528.51508, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14102, "r_y0": 531.7060200000001, "r_x1": 426.66803, "r_y1": 531.7060200000001, "r_x2": 426.66803, "r_y2": 527.4428399999999, "r_x3": 424.14102, "r_y3": 527.4428399999999, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0018, "r_y0": 521.71713, "r_x1": 455.52881, "r_y1": 521.71713, "r_x2": 455.52881, "r_y2": 517.4539500000001, "r_x3": 453.0018, "r_y3": 517.4539500000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.85825, "r_y0": 521.32599, "r_x1": 426.38525, "r_y1": 521.32599, "r_x2": 426.38525, "r_y2": 517.06281, "r_x3": 423.85825, "r_y3": 517.06281, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4342, "r_y0": 562.35719, "r_x1": 337.27542, "r_y1": 562.35719, "r_x2": 337.27542, "r_y2": 557.36679, "r_x3": 333.4342, "r_y3": 557.36679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35397, "r_y0": 562.30719, "r_x1": 344.19519, "r_y1": 562.30719, "r_x2": 344.19519, "r_y2": 557.31679, "r_x3": 340.35397, "r_y3": 557.31679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.30978, "r_y0": 568.8557900000001, "r_x1": 344.151, "r_y1": 568.8557900000001, "r_x2": 344.151, "r_y2": 563.8653899999999, "r_x3": 340.30978, "r_y3": 563.8653899999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.79904, "r_y0": 568.85907, "r_x1": 350.64026, "r_y1": 568.85907, "r_x2": 350.64026, "r_y2": 563.8686700000001, "r_x3": 346.79904, "r_y3": 563.8686700000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.59583, "r_y0": 568.81311, "r_x1": 337.43704, "r_y1": 568.81311, "r_x2": 337.43704, "r_y2": 563.82271, "r_x3": 333.59583, "r_y3": 563.82271, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37543, "r_y0": 575.41713, "r_x1": 344.21664, "r_y1": 575.41713, "r_x2": 344.21664, "r_y2": 570.42673, "r_x3": 340.37543, "r_y3": 570.42673, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86469, "r_y0": 575.42041, "r_x1": 350.7059, "r_y1": 575.42041, "r_x2": 350.7059, "r_y2": 570.43001, "r_x3": 346.86469, "r_y3": 570.43001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66144, "r_y0": 575.37445, "r_x1": 337.50266, "r_y1": 575.37445, "r_x2": 337.50266, "r_y2": 570.38405, "r_x3": 333.66144, "r_y3": 570.38405, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37671, "r_y0": 582.0164599999999, "r_x1": 344.21793, "r_y1": 582.0164599999999, "r_x2": 344.21793, "r_y2": 577.02606, "r_x3": 340.37671, "r_y3": 577.02606, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86597, "r_y0": 582.01974, "r_x1": 350.70718, "r_y1": 582.01974, "r_x2": 350.70718, "r_y2": 577.02934, "r_x3": 346.86597, "r_y3": 577.02934, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66272, "r_y0": 581.97379, "r_x1": 337.50394, "r_y1": 581.97379, "r_x2": 337.50394, "r_y2": 576.98338, "r_x3": 333.66272, "r_y3": 576.98338, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.27948, "r_y0": 588.38777, "r_x1": 344.1207, "r_y1": 588.38777, "r_x2": 344.1207, "r_y2": 583.39737, "r_x3": 340.27948, "r_y3": 583.39737, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.76874, "r_y0": 588.39108, "r_x1": 350.60995, "r_y1": 588.39108, "r_x2": 350.60995, "r_y2": 583.40068, "r_x3": 346.76874, "r_y3": 583.40068, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.56549, "r_y0": 588.34514, "r_x1": 337.40671, "r_y1": 588.34514, "r_x2": 337.40671, "r_y2": 583.35474, "r_x3": 333.56549, "r_y3": 583.35474, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03326, "r_y0": 561.87354, "r_x1": 359.83362, "r_y1": 561.87354, "r_x2": 359.83362, "r_y2": 556.8831299999999, "r_x3": 353.03326, "r_y3": 556.8831299999999, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.18604, "r_y0": 568.57085, "r_x1": 359.98639, "r_y1": 568.57085, "r_x2": 359.98639, "r_y2": 563.58044, "r_x3": 353.18604, "r_y3": 563.58044, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19864, "r_y0": 575.15276, "r_x1": 359.99899, "r_y1": 575.15276, "r_x2": 359.99899, "r_y2": 570.1623500000001, "r_x3": 353.19864, "r_y3": 570.1623500000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.1532, "r_y0": 581.75652, "r_x1": 359.95355, "r_y1": 581.75652, "r_x2": 359.95355, "r_y2": 576.76611, "r_x3": 353.1532, "r_y3": 576.76611, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.26935, "r_y0": 588.3966800000001, "r_x1": 360.0697, "r_y1": 588.3966800000001, "r_x2": 360.0697, "r_y2": 583.40628, "r_x3": 353.26935, "r_y3": 583.40628, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.37979, "r_y0": 562.07275, "r_x1": 350.33786, "r_y1": 562.07275, "r_x2": 350.33786, "r_y2": 557.08235, "r_x3": 347.37979, "r_y3": 557.08235, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14026, "r_y0": 568.55399, "r_x1": 333.66727, "r_y1": 568.55399, "r_x2": 333.66727, "r_y2": 564.2907700000001, "r_x3": 331.14026, "r_y3": 564.2907700000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.80972, "r_y0": 558.85634, "r_x1": 343.33673, "r_y1": 558.85634, "r_x2": 343.33673, "r_y2": 554.59312, "r_x3": 340.80972, "r_y3": 554.59312, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.97992, "r_y0": 559.09357, "r_x1": 333.50693, "r_y1": 559.09357, "r_x2": 333.50693, "r_y2": 554.83035, "r_x3": 330.97992, "r_y3": 554.83035, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 13, "label": "text", "bbox": { "l": 147.30025, "t": 540.73164, "r": 149.70605, "b": 543.1000799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 543.1000799999999, "r_x1": 149.70605, "r_y1": 543.1000799999999, "r_x2": 149.70605, "r_y2": 540.73164, "r_x3": 147.30025, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 150.90895, "t": 540.73164, "r": 155.72055, "b": 543.1000799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 543.1000799999999, "r_x1": 155.72055, "r_y1": 543.1000799999999, "r_x2": 155.72055, "r_y2": 540.73164, "r_x3": 150.90895, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 162.75987, "t": 535.3938, "r": 172.2963, "b": 537.76224, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.75987, "r_y0": 537.76224, "r_x1": 172.2963, "r_y1": 537.76224, "r_x2": 172.2963, "r_y2": 535.3938, "r_x3": 162.75987, "r_y3": 535.3938, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 147.63603, "t": 535.3661500000001, "r": 155.91753, "b": 537.73459, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.63603, "r_y0": 537.73459, "r_x1": 155.91753, "r_y1": 537.73459, "r_x2": 155.91753, "r_y2": 535.3661500000001, "r_x3": 147.63603, "r_y3": 535.3661500000001, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 158.48466, "t": 540.73164, "r": 164.10178, "b": 543.1000799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 543.1000799999999, "r_x1": 164.10178, "r_y1": 543.1000799999999, "r_x2": 164.10178, "r_y2": 540.73164, "r_x3": 158.48466, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 158.48466, "t": 544.67065, "r": 162.69737, "b": 547.03909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 547.03909, "r_x1": 162.69737, "r_y1": 547.03909, "r_x2": 162.69737, "r_y2": 544.67065, "r_x3": 158.48466, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 158.48466, "t": 548.91264, "r": 164.10178, "b": 551.28108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 551.28108, "r_x1": 164.10178, "r_y1": 551.28108, "r_x2": 164.10178, "r_y2": 548.91264, "r_x3": 158.48466, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 158.48466, "t": 553.15465, "r": 162.69737, "b": 555.52309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 555.52309, "r_x1": 162.69737, "r_y1": 555.52309, "r_x2": 162.69737, "r_y2": 553.15465, "r_x3": 158.48466, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 168.81696, "t": 540.73164, "r": 172.88876, "b": 543.1000799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 543.1000799999999, "r_x1": 172.88876, "r_y1": 543.1000799999999, "r_x2": 172.88876, "r_y2": 540.73164, "r_x3": 168.81696, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 168.81696, "t": 544.67065, "r": 172.88876, "b": 547.03909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 547.03909, "r_x1": 172.88876, "r_y1": 547.03909, "r_x2": 172.88876, "r_y2": 544.67065, "r_x3": 168.81696, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 168.81696, "t": 548.91264, "r": 172.88876, "b": 551.28108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 551.28108, "r_x1": 172.88876, "r_y1": 551.28108, "r_x2": 172.88876, "r_y2": 548.91264, "r_x3": 168.81696, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 168.81696, "t": 553.15465, "r": 172.88876, "b": 555.52309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 555.52309, "r_x1": 172.88876, "r_y1": 555.52309, "r_x2": 172.88876, "r_y2": 553.15465, "r_x3": 168.81696, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 147.30025, "t": 544.67065, "r": 149.70605, "b": 547.03909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 547.03909, "r_x1": 149.70605, "r_y1": 547.03909, "r_x2": 149.70605, "r_y2": 544.67065, "r_x3": 147.30025, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 150.90895, "t": 544.67065, "r": 155.72055, "b": 547.03909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 547.03909, "r_x1": 155.72055, "r_y1": 547.03909, "r_x2": 155.72055, "r_y2": 544.67065, "r_x3": 150.90895, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 147.30025, "t": 548.91264, "r": 149.70605, "b": 551.28108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 551.28108, "r_x1": 149.70605, "r_y1": 551.28108, "r_x2": 149.70605, "r_y2": 548.91264, "r_x3": 147.30025, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 150.90895, "t": 548.91264, "r": 155.72055, "b": 551.28108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 551.28108, "r_x1": 155.72055, "r_y1": 551.28108, "r_x2": 155.72055, "r_y2": 548.91264, "r_x3": 150.90895, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 147.30025, "t": 553.15465, "r": 149.70605, "b": 555.52309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 555.52309, "r_x1": 149.70605, "r_y1": 555.52309, "r_x2": 149.70605, "r_y2": 553.15465, "r_x3": 147.30025, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 150.90895, "t": 553.15465, "r": 155.72055, "b": 555.52309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 555.52309, "r_x1": 155.72055, "r_y1": 555.52309, "r_x2": 155.72055, "r_y2": 553.15465, "r_x3": 150.90895, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 152.05046, "t": 517.0098, "r": 171.24945, "b": 521.27298, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05046, "r_y0": 521.27298, "r_x1": 171.24945, "r_y1": 521.27298, "r_x2": 171.24945, "r_y2": 517.0098, "r_x3": 152.05046, "r_y3": 517.0098, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 148.13347, "t": 522.3122900000001, "r": 175.16759, "b": 526.57547, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13347, "r_y0": 526.57547, "r_x1": 175.16759, "r_y1": 526.57547, "r_x2": 175.16759, "r_y2": 522.3122900000001, "r_x3": 148.13347, "r_y3": 522.3122900000001, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 193.53331, "t": 524.51422, "r": 220.31973, "b": 528.7774, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53331, "r_y0": 528.7774, "r_x1": 220.31973, "r_y1": 528.7774, "r_x2": 220.31973, "r_y2": 524.51422, "r_x3": 193.53331, "r_y3": 524.51422, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 199.47311, "t": 529.8167100000001, "r": 214.37889, "b": 534.0799, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47311, "r_y0": 534.0799, "r_x1": 214.37889, "r_y1": 534.0799, "r_x2": 214.37889, "r_y2": 529.8167100000001, "r_x3": 199.47311, "r_y3": 529.8167100000001, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 273.61066, "t": 509.9053, "r": 284.47275, "b": 514.16849, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61066, "r_y0": 514.16849, "r_x1": 284.47275, "r_y1": 514.16849, "r_x2": 284.47275, "r_y2": 509.9053, "r_x3": 273.61066, "r_y3": 509.9053, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 270.45187, "t": 513.6928399999999, "r": 287.63242, "b": 517.9560200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 517.9560200000001, "r_x1": 287.63242, "r_y1": 517.9560200000001, "r_x2": 287.63242, "r_y2": 513.6928399999999, "r_x3": 270.45187, "r_y3": 513.6928399999999, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 332.47852, "t": 508.14438, "r": 348.14014, "b": 512.40756, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.47852, "r_y0": 512.40756, "r_x1": 348.14014, "r_y1": 512.40756, "r_x2": 348.14014, "r_y2": 508.14438, "r_x3": 332.47852, "r_y3": 508.14438, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 376.68622, "t": 521.12024, "r": 407.25497, "b": 525.38342, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.68622, "r_y0": 525.38342, "r_x1": 407.25497, "r_y1": 525.38342, "r_x2": 407.25497, "r_y2": 521.12024, "r_x3": 376.68622, "r_y3": 521.12024, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 373.90869, "t": 525.66525, "r": 410.03506, "b": 529.92844, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.90869, "r_y0": 529.92844, "r_x1": 410.03506, "r_y1": 529.92844, "r_x2": 410.03506, "r_y2": 525.66525, "r_x3": 373.90869, "r_y3": 525.66525, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 375.29871, "t": 530.21024, "r": 408.64902, "b": 534.47342, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.29871, "r_y0": 534.47342, "r_x1": 408.64902, "r_y1": 534.47342, "r_x2": 408.64902, "r_y2": 530.21024, "r_x3": 375.29871, "r_y3": 530.21024, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 377.06747, "t": 534.75522, "r": 406.88312, "b": 539.01843, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.06747, "r_y0": 539.01843, "r_x1": 406.88312, "r_y1": 539.01843, "r_x2": 406.88312, "r_y2": 534.75522, "r_x3": 377.06747, "r_y3": 534.75522, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 383.56683, "t": 563.24176, "r": 433.76544, "b": 567.50497, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.56683, "r_y0": 567.50497, "r_x1": 433.76544, "r_y1": 567.50497, "r_x2": 433.76544, "r_y2": 563.24176, "r_x3": 383.56683, "r_y3": 563.24176, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 383.52768, "t": 567.78676, "r": 433.80764999999997, "b": 572.04997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.52768, "r_y0": 572.04997, "r_x1": 433.80764999999997, "r_y1": 572.04997, "r_x2": 433.80764999999997, "r_y2": 567.78676, "r_x3": 383.52768, "r_y3": 567.78676, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 390.47522, "t": 572.33177, "r": 426.85703, "b": 576.59499, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.47522, "r_y0": 576.59499, "r_x1": 426.85703, "r_y1": 576.59499, "r_x2": 426.85703, "r_y2": 572.33177, "r_x3": 390.47522, "r_y3": 572.33177, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 293.94702, "t": 577.89143, "r": 323.1691, "b": 582.15465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 582.15465, "r_x1": 323.1691, "r_y1": 582.15465, "r_x2": 323.1691, "r_y2": 577.89143, "r_x3": 293.94702, "r_y3": 577.89143, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 293.94702, "t": 582.43648, "r": 324.59396, "b": 586.69969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 586.69969, "r_x1": 324.59396, "r_y1": 586.69969, "r_x2": 324.59396, "r_y2": 582.43648, "r_x3": 293.94702, "r_y3": 582.43648, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 333.07819, "t": 541.82269, "r": 364.14691, "b": 546.08591, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 546.08591, "r_x1": 364.14691, "r_y1": 546.08591, "r_x2": 364.14691, "r_y2": 541.82269, "r_x3": 333.07819, "r_y3": 541.82269, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 333.07819, "t": 545.6102, "r": 369.71542, "b": 549.87341, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 549.87341, "r_x1": 369.71542, "r_y1": 549.87341, "r_x2": 369.71542, "r_y2": 545.6102, "r_x3": 333.07819, "r_y3": 545.6102, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 232.65881000000002, "t": 515.24139, "r": 249.58894000000004, "b": 519.50458, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.65881000000002, "r_y0": 519.50458, "r_x1": 249.58894000000004, "r_y1": 519.50458, "r_x2": 249.58894000000004, "r_y2": 515.24139, "r_x3": 232.65881000000002, "r_y3": 515.24139, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 269.8219, "t": 545.97102, "r": 288.26279, "b": 550.23424, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8219, "r_y0": 550.23424, "r_x1": 288.26279, "r_y1": 550.23424, "r_x2": 288.26279, "r_y2": 545.97102, "r_x3": 269.8219, "r_y3": 545.97102, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 270.45187, "t": 549.75851, "r": 287.63242, "b": 554.0217299999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 554.0217299999999, "r_x1": 287.63242, "r_y1": 554.0217299999999, "r_x2": 287.63242, "r_y2": 549.75851, "r_x3": 270.45187, "r_y3": 549.75851, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 332.17676, "t": 515.91205, "r": 358.11206, "b": 520.17523, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 520.17523, "r_x1": 358.11206, "r_y1": 520.17523, "r_x2": 358.11206, "r_y2": 515.91205, "r_x3": 332.17676, "r_y3": 515.91205, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 332.17676, "t": 521.9720500000001, "r": 361.58298, "b": 526.23523, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 526.23523, "r_x1": 361.58298, "r_y1": 526.23523, "r_x2": 361.58298, "r_y2": 521.9720500000001, "r_x3": 332.17676, "r_y3": 521.9720500000001, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 332.17676, "t": 528.03204, "r": 364.76474, "b": 532.29523, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 532.29523, "r_x1": 364.76474, "r_y1": 532.29523, "r_x2": 364.76474, "r_y2": 528.03204, "r_x3": 332.17676, "r_y3": 528.03204, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 332.17676, "t": 534.09204, "r": 335.96548, "b": 538.35524, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 538.35524, "r_x1": 335.96548, "r_y1": 538.35524, "r_x2": 335.96548, "r_y2": 534.09204, "r_x3": 332.17676, "r_y3": 534.09204, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.8894, "t": 516.39508, "r": 329.41641, "b": 520.6582599999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8894, "r_y0": 520.6582599999999, "r_x1": 329.41641, "r_y1": 520.6582599999999, "r_x2": 329.41641, "r_y2": 516.39508, "r_x3": 326.8894, "r_y3": 516.39508, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 327.04089, "t": 522.4247700000001, "r": 329.5679, "b": 526.68796, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 526.68796, "r_x1": 329.5679, "r_y1": 526.68796, "r_x2": 329.5679, "r_y2": 522.4247700000001, "r_x3": 327.04089, "r_y3": 522.4247700000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 327.04089, "t": 528.51508, "r": 329.5679, "b": 532.77826, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 532.77826, "r_x1": 329.5679, "r_y1": 532.77826, "r_x2": 329.5679, "r_y2": 528.51508, "r_x3": 327.04089, "r_y3": 528.51508, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 424.14102, "t": 527.4428399999999, "r": 426.66803, "b": 531.7060200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14102, "r_y0": 531.7060200000001, "r_x1": 426.66803, "r_y1": 531.7060200000001, "r_x2": 426.66803, "r_y2": 527.4428399999999, "r_x3": 424.14102, "r_y3": 527.4428399999999, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 453.0018, "t": 517.4539500000001, "r": 455.52881, "b": 521.71713, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0018, "r_y0": 521.71713, "r_x1": 455.52881, "r_y1": 521.71713, "r_x2": 455.52881, "r_y2": 517.4539500000001, "r_x3": 453.0018, "r_y3": 517.4539500000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 423.85825, "t": 517.06281, "r": 426.38525, "b": 521.32599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.85825, "r_y0": 521.32599, "r_x1": 426.38525, "r_y1": 521.32599, "r_x2": 426.38525, "r_y2": 517.06281, "r_x3": 423.85825, "r_y3": 517.06281, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 333.4342, "t": 557.36679, "r": 337.27542, "b": 562.35719, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4342, "r_y0": 562.35719, "r_x1": 337.27542, "r_y1": 562.35719, "r_x2": 337.27542, "r_y2": 557.36679, "r_x3": 333.4342, "r_y3": 557.36679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 340.35397, "t": 557.31679, "r": 344.19519, "b": 562.30719, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35397, "r_y0": 562.30719, "r_x1": 344.19519, "r_y1": 562.30719, "r_x2": 344.19519, "r_y2": 557.31679, "r_x3": 340.35397, "r_y3": 557.31679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 340.30978, "t": 563.8653899999999, "r": 344.151, "b": 568.8557900000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.30978, "r_y0": 568.8557900000001, "r_x1": 344.151, "r_y1": 568.8557900000001, "r_x2": 344.151, "r_y2": 563.8653899999999, "r_x3": 340.30978, "r_y3": 563.8653899999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 346.79904, "t": 563.8686700000001, "r": 350.64026, "b": 568.85907, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.79904, "r_y0": 568.85907, "r_x1": 350.64026, "r_y1": 568.85907, "r_x2": 350.64026, "r_y2": 563.8686700000001, "r_x3": 346.79904, "r_y3": 563.8686700000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 333.59583, "t": 563.82271, "r": 337.43704, "b": 568.81311, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.59583, "r_y0": 568.81311, "r_x1": 337.43704, "r_y1": 568.81311, "r_x2": 337.43704, "r_y2": 563.82271, "r_x3": 333.59583, "r_y3": 563.82271, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 340.37543, "t": 570.42673, "r": 344.21664, "b": 575.41713, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37543, "r_y0": 575.41713, "r_x1": 344.21664, "r_y1": 575.41713, "r_x2": 344.21664, "r_y2": 570.42673, "r_x3": 340.37543, "r_y3": 570.42673, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 346.86469, "t": 570.43001, "r": 350.7059, "b": 575.42041, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86469, "r_y0": 575.42041, "r_x1": 350.7059, "r_y1": 575.42041, "r_x2": 350.7059, "r_y2": 570.43001, "r_x3": 346.86469, "r_y3": 570.43001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 333.66144, "t": 570.38405, "r": 337.50266, "b": 575.37445, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66144, "r_y0": 575.37445, "r_x1": 337.50266, "r_y1": 575.37445, "r_x2": 337.50266, "r_y2": 570.38405, "r_x3": 333.66144, "r_y3": 570.38405, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 340.37671, "t": 577.02606, "r": 344.21793, "b": 582.0164599999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37671, "r_y0": 582.0164599999999, "r_x1": 344.21793, "r_y1": 582.0164599999999, "r_x2": 344.21793, "r_y2": 577.02606, "r_x3": 340.37671, "r_y3": 577.02606, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 346.86597, "t": 577.02934, "r": 350.70718, "b": 582.01974, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86597, "r_y0": 582.01974, "r_x1": 350.70718, "r_y1": 582.01974, "r_x2": 350.70718, "r_y2": 577.02934, "r_x3": 346.86597, "r_y3": 577.02934, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 333.66272, "t": 576.98338, "r": 337.50394, "b": 581.97379, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66272, "r_y0": 581.97379, "r_x1": 337.50394, "r_y1": 581.97379, "r_x2": 337.50394, "r_y2": 576.98338, "r_x3": 333.66272, "r_y3": 576.98338, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 340.27948, "t": 583.39737, "r": 344.1207, "b": 588.38777, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.27948, "r_y0": 588.38777, "r_x1": 344.1207, "r_y1": 588.38777, "r_x2": 344.1207, "r_y2": 583.39737, "r_x3": 340.27948, "r_y3": 583.39737, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 346.76874, "t": 583.40068, "r": 350.60995, "b": 588.39108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.76874, "r_y0": 588.39108, "r_x1": 350.60995, "r_y1": 588.39108, "r_x2": 350.60995, "r_y2": 583.40068, "r_x3": 346.76874, "r_y3": 583.40068, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 333.56549, "t": 583.35474, "r": 337.40671, "b": 588.34514, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.56549, "r_y0": 588.34514, "r_x1": 337.40671, "r_y1": 588.34514, "r_x2": 337.40671, "r_y2": 583.35474, "r_x3": 333.56549, "r_y3": 583.35474, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 353.03326, "t": 556.8831299999999, "r": 359.83362, "b": 561.87354, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03326, "r_y0": 561.87354, "r_x1": 359.83362, "r_y1": 561.87354, "r_x2": 359.83362, "r_y2": 556.8831299999999, "r_x3": 353.03326, "r_y3": 556.8831299999999, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 353.18604, "t": 563.58044, "r": 359.98639, "b": 568.57085, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.18604, "r_y0": 568.57085, "r_x1": 359.98639, "r_y1": 568.57085, "r_x2": 359.98639, "r_y2": 563.58044, "r_x3": 353.18604, "r_y3": 563.58044, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 353.19864, "t": 570.1623500000001, "r": 359.99899, "b": 575.15276, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19864, "r_y0": 575.15276, "r_x1": 359.99899, "r_y1": 575.15276, "r_x2": 359.99899, "r_y2": 570.1623500000001, "r_x3": 353.19864, "r_y3": 570.1623500000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 353.1532, "t": 576.76611, "r": 359.95355, "b": 581.75652, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.1532, "r_y0": 581.75652, "r_x1": 359.95355, "r_y1": 581.75652, "r_x2": 359.95355, "r_y2": 576.76611, "r_x3": 353.1532, "r_y3": 576.76611, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 353.26935, "t": 583.40628, "r": 360.0697, "b": 588.3966800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.26935, "r_y0": 588.3966800000001, "r_x1": 360.0697, "r_y1": 588.3966800000001, "r_x2": 360.0697, "r_y2": 583.40628, "r_x3": 353.26935, "r_y3": 583.40628, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 347.37979, "t": 557.08235, "r": 350.33786, "b": 562.07275, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.37979, "r_y0": 562.07275, "r_x1": 350.33786, "r_y1": 562.07275, "r_x2": 350.33786, "r_y2": 557.08235, "r_x3": 347.37979, "r_y3": 557.08235, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 331.14026, "t": 564.2907700000001, "r": 333.66727, "b": 568.55399, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14026, "r_y0": 568.55399, "r_x1": 333.66727, "r_y1": 568.55399, "r_x2": 333.66727, "r_y2": 564.2907700000001, "r_x3": 331.14026, "r_y3": 564.2907700000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 340.80972, "t": 554.59312, "r": 343.33673, "b": 558.85634, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.80972, "r_y0": 558.85634, "r_x1": 343.33673, "r_y1": 558.85634, "r_x2": 343.33673, "r_y2": 554.59312, "r_x3": 340.80972, "r_y3": 554.59312, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 330.97992, "t": 554.83035, "r": 333.50693, "b": 559.09357, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.97992, "r_y0": 559.09357, "r_x1": 333.50693, "r_y1": 559.09357, "r_x2": 333.50693, "r_y2": 554.83035, "r_x3": 330.97992, "r_y3": 554.83035, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 4, "page_no": 7, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.765, "t": 620.19278, "r": 480.5917400000001, "b": 664.8547599999999, "coord_origin": "TOPLEFT" }, "confidence": 0.951270341873169, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 628.98975, "r_x1": 480.58792, "r_y1": 628.98975, "r_x2": 480.58792, "r_y2": 620.19278, "r_x3": 149.709, "r_y3": 620.19278, "coord_origin": "TOPLEFT" }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 640.94475, "r_x1": 480.58871, "r_y1": 640.94475, "r_x2": 480.58871, "r_y2": 632.14778, "r_x3": 134.765, "r_y3": 632.14778, "coord_origin": "TOPLEFT" }, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 652.89975, "r_x1": 480.5917400000001, "r_y1": 652.89975, "r_x2": 480.5917400000001, "r_y2": 644.1027799999999, "r_x3": 134.765, "r_y3": 644.1027799999999, "coord_origin": "TOPLEFT" }, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 664.8547599999999, "r_x1": 480.58968999999996, "r_y1": 664.8547599999999, "r_x2": 480.58968999999996, "r_y2": 656.0577900000001, "r_x3": 134.765, "r_y3": 656.0577900000001, "coord_origin": "TOPLEFT" }, "text": "cells. The predicted OTSL structures were converted back to HTML format in", "orig": "cells. The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for table structure prediction, and Mean Average Precision (mAP) with 0.75 Intersection Over Union (IOU) threshold for the bounding-box predictions of table cells. The predicted OTSL structures were converted back to HTML format in" } ], "body": [ { "label": "text", "id": 5, "page_no": 7, "cluster": { "id": 5, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.58884000000006, "b": 139.68579, "coord_origin": "TOPLEFT" }, "confidence": 0.9464744925498962, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.58884000000006, "r_y1": 127.73077, "r_x2": 480.58884000000006, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 163.56389, "r_y1": 139.68579, "r_x2": 163.56389, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "reduces significantly the column drift seen in the HTML based models (see Figure 5)." }, { "label": "section_header", "id": 2, "page_no": 7, "cluster": { "id": 2, "label": "section_header", "bbox": { "l": 134.765, "t": 161.55682000000002, "r": 319.34708, "b": 170.36377000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9549514651298523, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 170.36377000000005, "r_x1": 149.40205, "r_y1": 170.36377000000005, "r_x2": 149.40205, "r_y2": 161.55682000000002, "r_x3": 134.765, "r_y3": 161.55682000000002, "coord_origin": "TOPLEFT" }, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 170.36377000000005, "r_x1": 319.34708, "r_y1": 170.36377000000005, "r_x2": 319.34708, "r_y2": 161.55682000000002, "r_x3": 160.85904, "r_y3": 161.55682000000002, "coord_origin": "TOPLEFT" }, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.3 Error-detection and -mitigation" }, { "label": "text", "id": 0, "page_no": 7, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.765, "t": 182.28179999999998, "r": 480.5957599999999, "b": 298.67584, "coord_origin": "TOPLEFT" }, "confidence": 0.9879790544509888, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 191.0788, "r_x1": 480.59572999999995, "r_y1": 191.0788, "r_x2": 480.59572999999995, "r_y2": 182.28179999999998, "r_x3": 134.765, "r_y3": 182.28179999999998, "coord_origin": "TOPLEFT" }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 203.03479000000004, "r_x1": 480.59473, "r_y1": 203.03479000000004, "r_x2": 480.59473, "r_y2": 194.23779000000002, "r_x3": 134.765, "r_y3": 194.23779000000002, "coord_origin": "TOPLEFT" }, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 214.98981000000003, "r_x1": 480.58678999999995, "r_y1": 214.98981000000003, "r_x2": 480.58678999999995, "r_y2": 206.19281, "r_x3": 134.765, "r_y3": 206.19281, "coord_origin": "TOPLEFT" }, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 226.94482000000005, "r_x1": 480.59177000000005, "r_y1": 226.94482000000005, "r_x2": 480.59177000000005, "r_y2": 218.14783, "r_x3": 134.765, "r_y3": 218.14783, "coord_origin": "TOPLEFT" }, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 238.89984000000004, "r_x1": 480.58768, "r_y1": 238.89984000000004, "r_x2": 480.58768, "r_y2": 230.10284000000001, "r_x3": 134.765, "r_y3": 230.10284000000001, "coord_origin": "TOPLEFT" }, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 250.85486000000003, "r_x1": 480.5867, "r_y1": 250.85486000000003, "r_x2": 480.5867, "r_y2": 242.05786, "r_x3": 134.765, "r_y3": 242.05786, "coord_origin": "TOPLEFT" }, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 262.80988, "r_x1": 480.5938100000001, "r_y1": 262.80988, "r_x2": 480.5938100000001, "r_y2": 254.01288, "r_x3": 134.765, "r_y3": 254.01288, "coord_origin": "TOPLEFT" }, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 274.76586999999995, "r_x1": 480.59069999999997, "r_y1": 274.76586999999995, "r_x2": 480.59069999999997, "r_y2": 265.96887000000004, "r_x3": 134.765, "r_y3": 265.96887000000004, "coord_origin": "TOPLEFT" }, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 286.72086, "r_x1": 480.5957599999999, "r_y1": 286.72086, "r_x2": 480.5957599999999, "r_y2": 277.92389000000003, "r_x3": 134.765, "r_y3": 277.92389000000003, "coord_origin": "TOPLEFT" }, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 298.67584, "r_x1": 469.40369, "r_y1": 298.67584, "r_x2": 469.40369, "r_y2": 289.8788799999999, "r_x3": 134.765, "r_y3": 289.8788799999999, "coord_origin": "TOPLEFT" }, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished sequence. The detection of an invalid sequence token is a clear indication of a prediction mistake, however a valid sequence by itself does not guarantee prediction correctness. Different heuristics can be used to correct token errors in an invalid sequence and thus increase the chances for accurate predictions. Such heuristics can be applied either after the prediction of each token, or at the end on the entire predicted sequence. For example a simple heuristic which can correct the predicted OTSL sequence on-the-fly is to verify if the token with the highest prediction confidence invalidates the predicted sequence, and replace it by the token with the next highest confidence until OTSL rules are satisfied." }, { "label": "section_header", "id": 3, "page_no": 7, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.765, "t": 321.164, "r": 229.03534, "b": 331.73239000000007, "coord_origin": "TOPLEFT" }, "confidence": 0.95152747631073, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 331.73239000000007, "r_x1": 141.4886, "r_y1": 331.73239000000007, "r_x2": 141.4886, "r_y2": 321.164, "r_x3": 134.765, "r_y3": 321.164, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9382, "r_y0": 331.73239000000007, "r_x1": 229.03534, "r_y1": 331.73239000000007, "r_x2": 229.03534, "r_y2": 321.164, "r_x3": 154.9382, "r_y3": 321.164, "coord_origin": "TOPLEFT" }, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5 Experiments" }, { "label": "text", "id": 1, "page_no": 7, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 347.24985, "r": 480.59528, "b": 451.6877099999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9877985119819641, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 356.04681, "r_x1": 480.59375, "r_y1": 356.04681, "r_x2": 480.59375, "r_y2": 347.24985, "r_x3": 134.765, "r_y3": 347.24985, "coord_origin": "TOPLEFT" }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 368.0018, "r_x1": 480.59476, "r_y1": 368.0018, "r_x2": 480.59476, "r_y2": 359.2048300000001, "r_x3": 134.765, "r_y3": 359.2048300000001, "coord_origin": "TOPLEFT" }, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 379.95679, "r_x1": 480.58786000000003, "r_y1": 379.95679, "r_x2": 480.58786000000003, "r_y2": 371.15982, "r_x3": 134.765, "r_y3": 371.15982, "coord_origin": "TOPLEFT" }, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 391.91177, "r_x1": 480.58777, "r_y1": 391.91177, "r_x2": 480.58777, "r_y2": 383.11481000000003, "r_x3": 134.765, "r_y3": 383.11481000000003, "coord_origin": "TOPLEFT" }, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 403.86676, "r_x1": 148.59807, "r_y1": 403.86676, "r_x2": 148.59807, "r_y2": 395.06978999999995, "r_x3": 134.765, "r_y3": 395.06978999999995, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.627, "r_y0": 403.86676, "r_x1": 191.84703, "r_y1": 403.86676, "r_x2": 191.84703, "r_y2": 395.06978999999995, "r_x3": 151.627, "r_y3": 395.06978999999995, "coord_origin": "TOPLEFT" }, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.90201, "r_y0": 403.86676, "r_x1": 480.59528, "r_y1": 403.86676, "r_x2": 480.59528, "r_y2": 395.06978999999995, "r_x3": 195.90201, "r_y3": 395.06978999999995, "coord_origin": "TOPLEFT" }, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 415.82175, "r_x1": 480.59283000000005, "r_y1": 415.82175, "r_x2": 480.59283000000005, "r_y2": 407.02478, "r_x3": 134.76501, "r_y3": 407.02478, "coord_origin": "TOPLEFT" }, "text": "found in the first step and evaluate how OTSL impacts the performance of", "orig": "found in the first step and evaluate how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 427.77774, "r_x1": 480.59476, "r_y1": 427.77774, "r_x2": 480.59476, "r_y2": 418.98077, "r_x3": 134.76501, "r_y3": 418.98077, "coord_origin": "TOPLEFT" }, "text": "TableFormer after training on other publicly available data sets (FinTabNet,", "orig": "TableFormer after training on other publicly available data sets (FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 439.73273, "r_x1": 480.59171, "r_y1": 439.73273, "r_x2": 480.59171, "r_y2": 430.93576, "r_x3": 134.76501, "r_y3": 430.93576, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 451.6877099999999, "r_x1": 479.30258, "r_y1": 451.6877099999999, "r_x2": 479.30258, "r_y2": 442.8907500000001, "r_x3": 134.76501, "r_y3": 442.8907500000001, "coord_origin": "TOPLEFT" }, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we conducted a series of experiments based on the TableFormer model (Figure 4) with two objectives: Firstly we evaluate the prediction quality and performance of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on the canonical PubTabNet data set. Secondly we pick the best hyper-parameters found in the first step and evaluate how OTSL impacts the performance of TableFormer after training on other publicly available data sets (FinTabNet, PubTables-1M [14]). The ground truth (GT) from all data sets has been converted into OTSL format for this purpose, and will be made publicly available." }, { "label": "caption", "id": 7, "page_no": 7, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 134.76501, "t": 484.64813, "r": 480.59082, "b": 503.73965, "coord_origin": "TOPLEFT" }, "confidence": 0.9297956228256226, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 492.57443, "r_x1": 162.64424, "r_y1": 492.57443, "r_x2": 162.64424, "r_y2": 484.64813, "r_x3": 134.76501, "r_y3": 484.64813, "coord_origin": "TOPLEFT" }, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.19601, "r_y0": 492.78067, "r_x1": 480.59082, "r_y1": 492.78067, "r_x2": 480.59082, "r_y2": 484.71091, "r_x3": 165.19601, "r_y3": 484.71091, "coord_origin": "TOPLEFT" }, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76501, "r_y0": 503.73965, "r_x1": 206.70245, "r_y1": 503.73965, "r_x2": 206.70245, "r_y2": 495.66989, "r_x3": 134.76501, "r_y3": 495.66989, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 4. Architecture sketch of the TableFormer model, which is a representative for the Im2Seq approach." }, { "label": "picture", "id": 6, "page_no": 7, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 140.70968627929688, "t": 508.0638427734375, "r": 472.73382568359375, "b": 593.6771850585938, "coord_origin": "TOPLEFT" }, "confidence": 0.9303396344184875, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 543.1000799999999, "r_x1": 149.70605, "r_y1": 543.1000799999999, "r_x2": 149.70605, "r_y2": 540.73164, "r_x3": 147.30025, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 543.1000799999999, "r_x1": 155.72055, "r_y1": 543.1000799999999, "r_x2": 155.72055, "r_y2": 540.73164, "r_x3": 150.90895, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.75987, "r_y0": 537.76224, "r_x1": 172.2963, "r_y1": 537.76224, "r_x2": 172.2963, "r_y2": 535.3938, "r_x3": 162.75987, "r_y3": 535.3938, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.63603, "r_y0": 537.73459, "r_x1": 155.91753, "r_y1": 537.73459, "r_x2": 155.91753, "r_y2": 535.3661500000001, "r_x3": 147.63603, "r_y3": 535.3661500000001, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 543.1000799999999, "r_x1": 164.10178, "r_y1": 543.1000799999999, "r_x2": 164.10178, "r_y2": 540.73164, "r_x3": 158.48466, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 547.03909, "r_x1": 162.69737, "r_y1": 547.03909, "r_x2": 162.69737, "r_y2": 544.67065, "r_x3": 158.48466, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 551.28108, "r_x1": 164.10178, "r_y1": 551.28108, "r_x2": 164.10178, "r_y2": 548.91264, "r_x3": 158.48466, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 555.52309, "r_x1": 162.69737, "r_y1": 555.52309, "r_x2": 162.69737, "r_y2": 553.15465, "r_x3": 158.48466, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 543.1000799999999, "r_x1": 172.88876, "r_y1": 543.1000799999999, "r_x2": 172.88876, "r_y2": 540.73164, "r_x3": 168.81696, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 547.03909, "r_x1": 172.88876, "r_y1": 547.03909, "r_x2": 172.88876, "r_y2": 544.67065, "r_x3": 168.81696, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 551.28108, "r_x1": 172.88876, "r_y1": 551.28108, "r_x2": 172.88876, "r_y2": 548.91264, "r_x3": 168.81696, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 555.52309, "r_x1": 172.88876, "r_y1": 555.52309, "r_x2": 172.88876, "r_y2": 553.15465, "r_x3": 168.81696, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 547.03909, "r_x1": 149.70605, "r_y1": 547.03909, "r_x2": 149.70605, "r_y2": 544.67065, "r_x3": 147.30025, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 547.03909, "r_x1": 155.72055, "r_y1": 547.03909, "r_x2": 155.72055, "r_y2": 544.67065, "r_x3": 150.90895, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 551.28108, "r_x1": 149.70605, "r_y1": 551.28108, "r_x2": 149.70605, "r_y2": 548.91264, "r_x3": 147.30025, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 551.28108, "r_x1": 155.72055, "r_y1": 551.28108, "r_x2": 155.72055, "r_y2": 548.91264, "r_x3": 150.90895, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 555.52309, "r_x1": 149.70605, "r_y1": 555.52309, "r_x2": 149.70605, "r_y2": 553.15465, "r_x3": 147.30025, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 555.52309, "r_x1": 155.72055, "r_y1": 555.52309, "r_x2": 155.72055, "r_y2": 553.15465, "r_x3": 150.90895, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05046, "r_y0": 521.27298, "r_x1": 171.24945, "r_y1": 521.27298, "r_x2": 171.24945, "r_y2": 517.0098, "r_x3": 152.05046, "r_y3": 517.0098, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13347, "r_y0": 526.57547, "r_x1": 175.16759, "r_y1": 526.57547, "r_x2": 175.16759, "r_y2": 522.3122900000001, "r_x3": 148.13347, "r_y3": 522.3122900000001, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53331, "r_y0": 528.7774, "r_x1": 220.31973, "r_y1": 528.7774, "r_x2": 220.31973, "r_y2": 524.51422, "r_x3": 193.53331, "r_y3": 524.51422, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47311, "r_y0": 534.0799, "r_x1": 214.37889, "r_y1": 534.0799, "r_x2": 214.37889, "r_y2": 529.8167100000001, "r_x3": 199.47311, "r_y3": 529.8167100000001, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61066, "r_y0": 514.16849, "r_x1": 284.47275, "r_y1": 514.16849, "r_x2": 284.47275, "r_y2": 509.9053, "r_x3": 273.61066, "r_y3": 509.9053, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 517.9560200000001, "r_x1": 287.63242, "r_y1": 517.9560200000001, "r_x2": 287.63242, "r_y2": 513.6928399999999, "r_x3": 270.45187, "r_y3": 513.6928399999999, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.47852, "r_y0": 512.40756, "r_x1": 348.14014, "r_y1": 512.40756, "r_x2": 348.14014, "r_y2": 508.14438, "r_x3": 332.47852, "r_y3": 508.14438, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.68622, "r_y0": 525.38342, "r_x1": 407.25497, "r_y1": 525.38342, "r_x2": 407.25497, "r_y2": 521.12024, "r_x3": 376.68622, "r_y3": 521.12024, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.90869, "r_y0": 529.92844, "r_x1": 410.03506, "r_y1": 529.92844, "r_x2": 410.03506, "r_y2": 525.66525, "r_x3": 373.90869, "r_y3": 525.66525, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.29871, "r_y0": 534.47342, "r_x1": 408.64902, "r_y1": 534.47342, "r_x2": 408.64902, "r_y2": 530.21024, "r_x3": 375.29871, "r_y3": 530.21024, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.06747, "r_y0": 539.01843, "r_x1": 406.88312, "r_y1": 539.01843, "r_x2": 406.88312, "r_y2": 534.75522, "r_x3": 377.06747, "r_y3": 534.75522, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.56683, "r_y0": 567.50497, "r_x1": 433.76544, "r_y1": 567.50497, "r_x2": 433.76544, "r_y2": 563.24176, "r_x3": 383.56683, "r_y3": 563.24176, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.52768, "r_y0": 572.04997, "r_x1": 433.80764999999997, "r_y1": 572.04997, "r_x2": 433.80764999999997, "r_y2": 567.78676, "r_x3": 383.52768, "r_y3": 567.78676, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.47522, "r_y0": 576.59499, "r_x1": 426.85703, "r_y1": 576.59499, "r_x2": 426.85703, "r_y2": 572.33177, "r_x3": 390.47522, "r_y3": 572.33177, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 582.15465, "r_x1": 323.1691, "r_y1": 582.15465, "r_x2": 323.1691, "r_y2": 577.89143, "r_x3": 293.94702, "r_y3": 577.89143, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 586.69969, "r_x1": 324.59396, "r_y1": 586.69969, "r_x2": 324.59396, "r_y2": 582.43648, "r_x3": 293.94702, "r_y3": 582.43648, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 546.08591, "r_x1": 364.14691, "r_y1": 546.08591, "r_x2": 364.14691, "r_y2": 541.82269, "r_x3": 333.07819, "r_y3": 541.82269, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 549.87341, "r_x1": 369.71542, "r_y1": 549.87341, "r_x2": 369.71542, "r_y2": 545.6102, "r_x3": 333.07819, "r_y3": 545.6102, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.65881000000002, "r_y0": 519.50458, "r_x1": 249.58894000000004, "r_y1": 519.50458, "r_x2": 249.58894000000004, "r_y2": 515.24139, "r_x3": 232.65881000000002, "r_y3": 515.24139, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8219, "r_y0": 550.23424, "r_x1": 288.26279, "r_y1": 550.23424, "r_x2": 288.26279, "r_y2": 545.97102, "r_x3": 269.8219, "r_y3": 545.97102, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 554.0217299999999, "r_x1": 287.63242, "r_y1": 554.0217299999999, "r_x2": 287.63242, "r_y2": 549.75851, "r_x3": 270.45187, "r_y3": 549.75851, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 520.17523, "r_x1": 358.11206, "r_y1": 520.17523, "r_x2": 358.11206, "r_y2": 515.91205, "r_x3": 332.17676, "r_y3": 515.91205, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 526.23523, "r_x1": 361.58298, "r_y1": 526.23523, "r_x2": 361.58298, "r_y2": 521.9720500000001, "r_x3": 332.17676, "r_y3": 521.9720500000001, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 532.29523, "r_x1": 364.76474, "r_y1": 532.29523, "r_x2": 364.76474, "r_y2": 528.03204, "r_x3": 332.17676, "r_y3": 528.03204, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 538.35524, "r_x1": 335.96548, "r_y1": 538.35524, "r_x2": 335.96548, "r_y2": 534.09204, "r_x3": 332.17676, "r_y3": 534.09204, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8894, "r_y0": 520.6582599999999, "r_x1": 329.41641, "r_y1": 520.6582599999999, "r_x2": 329.41641, "r_y2": 516.39508, "r_x3": 326.8894, "r_y3": 516.39508, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 526.68796, "r_x1": 329.5679, "r_y1": 526.68796, "r_x2": 329.5679, "r_y2": 522.4247700000001, "r_x3": 327.04089, "r_y3": 522.4247700000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 532.77826, "r_x1": 329.5679, "r_y1": 532.77826, "r_x2": 329.5679, "r_y2": 528.51508, "r_x3": 327.04089, "r_y3": 528.51508, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14102, "r_y0": 531.7060200000001, "r_x1": 426.66803, "r_y1": 531.7060200000001, "r_x2": 426.66803, "r_y2": 527.4428399999999, "r_x3": 424.14102, "r_y3": 527.4428399999999, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0018, "r_y0": 521.71713, "r_x1": 455.52881, "r_y1": 521.71713, "r_x2": 455.52881, "r_y2": 517.4539500000001, "r_x3": 453.0018, "r_y3": 517.4539500000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.85825, "r_y0": 521.32599, "r_x1": 426.38525, "r_y1": 521.32599, "r_x2": 426.38525, "r_y2": 517.06281, "r_x3": 423.85825, "r_y3": 517.06281, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4342, "r_y0": 562.35719, "r_x1": 337.27542, "r_y1": 562.35719, "r_x2": 337.27542, "r_y2": 557.36679, "r_x3": 333.4342, "r_y3": 557.36679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35397, "r_y0": 562.30719, "r_x1": 344.19519, "r_y1": 562.30719, "r_x2": 344.19519, "r_y2": 557.31679, "r_x3": 340.35397, "r_y3": 557.31679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.30978, "r_y0": 568.8557900000001, "r_x1": 344.151, "r_y1": 568.8557900000001, "r_x2": 344.151, "r_y2": 563.8653899999999, "r_x3": 340.30978, "r_y3": 563.8653899999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.79904, "r_y0": 568.85907, "r_x1": 350.64026, "r_y1": 568.85907, "r_x2": 350.64026, "r_y2": 563.8686700000001, "r_x3": 346.79904, "r_y3": 563.8686700000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.59583, "r_y0": 568.81311, "r_x1": 337.43704, "r_y1": 568.81311, "r_x2": 337.43704, "r_y2": 563.82271, "r_x3": 333.59583, "r_y3": 563.82271, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37543, "r_y0": 575.41713, "r_x1": 344.21664, "r_y1": 575.41713, "r_x2": 344.21664, "r_y2": 570.42673, "r_x3": 340.37543, "r_y3": 570.42673, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86469, "r_y0": 575.42041, "r_x1": 350.7059, "r_y1": 575.42041, "r_x2": 350.7059, "r_y2": 570.43001, "r_x3": 346.86469, "r_y3": 570.43001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66144, "r_y0": 575.37445, "r_x1": 337.50266, "r_y1": 575.37445, "r_x2": 337.50266, "r_y2": 570.38405, "r_x3": 333.66144, "r_y3": 570.38405, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37671, "r_y0": 582.0164599999999, "r_x1": 344.21793, "r_y1": 582.0164599999999, "r_x2": 344.21793, "r_y2": 577.02606, "r_x3": 340.37671, "r_y3": 577.02606, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86597, "r_y0": 582.01974, "r_x1": 350.70718, "r_y1": 582.01974, "r_x2": 350.70718, "r_y2": 577.02934, "r_x3": 346.86597, "r_y3": 577.02934, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66272, "r_y0": 581.97379, "r_x1": 337.50394, "r_y1": 581.97379, "r_x2": 337.50394, "r_y2": 576.98338, "r_x3": 333.66272, "r_y3": 576.98338, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.27948, "r_y0": 588.38777, "r_x1": 344.1207, "r_y1": 588.38777, "r_x2": 344.1207, "r_y2": 583.39737, "r_x3": 340.27948, "r_y3": 583.39737, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.76874, "r_y0": 588.39108, "r_x1": 350.60995, "r_y1": 588.39108, "r_x2": 350.60995, "r_y2": 583.40068, "r_x3": 346.76874, "r_y3": 583.40068, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.56549, "r_y0": 588.34514, "r_x1": 337.40671, "r_y1": 588.34514, "r_x2": 337.40671, "r_y2": 583.35474, "r_x3": 333.56549, "r_y3": 583.35474, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03326, "r_y0": 561.87354, "r_x1": 359.83362, "r_y1": 561.87354, "r_x2": 359.83362, "r_y2": 556.8831299999999, "r_x3": 353.03326, "r_y3": 556.8831299999999, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.18604, "r_y0": 568.57085, "r_x1": 359.98639, "r_y1": 568.57085, "r_x2": 359.98639, "r_y2": 563.58044, "r_x3": 353.18604, "r_y3": 563.58044, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19864, "r_y0": 575.15276, "r_x1": 359.99899, "r_y1": 575.15276, "r_x2": 359.99899, "r_y2": 570.1623500000001, "r_x3": 353.19864, "r_y3": 570.1623500000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.1532, "r_y0": 581.75652, "r_x1": 359.95355, "r_y1": 581.75652, "r_x2": 359.95355, "r_y2": 576.76611, "r_x3": 353.1532, "r_y3": 576.76611, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.26935, "r_y0": 588.3966800000001, "r_x1": 360.0697, "r_y1": 588.3966800000001, "r_x2": 360.0697, "r_y2": 583.40628, "r_x3": 353.26935, "r_y3": 583.40628, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.37979, "r_y0": 562.07275, "r_x1": 350.33786, "r_y1": 562.07275, "r_x2": 350.33786, "r_y2": 557.08235, "r_x3": 347.37979, "r_y3": 557.08235, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14026, "r_y0": 568.55399, "r_x1": 333.66727, "r_y1": 568.55399, "r_x2": 333.66727, "r_y2": 564.2907700000001, "r_x3": 331.14026, "r_y3": 564.2907700000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.80972, "r_y0": 558.85634, "r_x1": 343.33673, "r_y1": 558.85634, "r_x2": 343.33673, "r_y2": 554.59312, "r_x3": 340.80972, "r_y3": 554.59312, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.97992, "r_y0": 559.09357, "r_x1": 333.50693, "r_y1": 559.09357, "r_x2": 333.50693, "r_y2": 554.83035, "r_x3": 330.97992, "r_y3": 554.83035, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 13, "label": "text", "bbox": { "l": 147.30025, "t": 540.73164, "r": 149.70605, "b": 543.1000799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 543.1000799999999, "r_x1": 149.70605, "r_y1": 543.1000799999999, "r_x2": 149.70605, "r_y2": 540.73164, "r_x3": 147.30025, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 150.90895, "t": 540.73164, "r": 155.72055, "b": 543.1000799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 543.1000799999999, "r_x1": 155.72055, "r_y1": 543.1000799999999, "r_x2": 155.72055, "r_y2": 540.73164, "r_x3": 150.90895, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 162.75987, "t": 535.3938, "r": 172.2963, "b": 537.76224, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.75987, "r_y0": 537.76224, "r_x1": 172.2963, "r_y1": 537.76224, "r_x2": 172.2963, "r_y2": 535.3938, "r_x3": 162.75987, "r_y3": 535.3938, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 147.63603, "t": 535.3661500000001, "r": 155.91753, "b": 537.73459, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.63603, "r_y0": 537.73459, "r_x1": 155.91753, "r_y1": 537.73459, "r_x2": 155.91753, "r_y2": 535.3661500000001, "r_x3": 147.63603, "r_y3": 535.3661500000001, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 158.48466, "t": 540.73164, "r": 164.10178, "b": 543.1000799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 543.1000799999999, "r_x1": 164.10178, "r_y1": 543.1000799999999, "r_x2": 164.10178, "r_y2": 540.73164, "r_x3": 158.48466, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 158.48466, "t": 544.67065, "r": 162.69737, "b": 547.03909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 547.03909, "r_x1": 162.69737, "r_y1": 547.03909, "r_x2": 162.69737, "r_y2": 544.67065, "r_x3": 158.48466, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 158.48466, "t": 548.91264, "r": 164.10178, "b": 551.28108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 551.28108, "r_x1": 164.10178, "r_y1": 551.28108, "r_x2": 164.10178, "r_y2": 548.91264, "r_x3": 158.48466, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 158.48466, "t": 553.15465, "r": 162.69737, "b": 555.52309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48466, "r_y0": 555.52309, "r_x1": 162.69737, "r_y1": 555.52309, "r_x2": 162.69737, "r_y2": 553.15465, "r_x3": 158.48466, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 168.81696, "t": 540.73164, "r": 172.88876, "b": 543.1000799999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 543.1000799999999, "r_x1": 172.88876, "r_y1": 543.1000799999999, "r_x2": 172.88876, "r_y2": 540.73164, "r_x3": 168.81696, "r_y3": 540.73164, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 168.81696, "t": 544.67065, "r": 172.88876, "b": 547.03909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 547.03909, "r_x1": 172.88876, "r_y1": 547.03909, "r_x2": 172.88876, "r_y2": 544.67065, "r_x3": 168.81696, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 168.81696, "t": 548.91264, "r": 172.88876, "b": 551.28108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 551.28108, "r_x1": 172.88876, "r_y1": 551.28108, "r_x2": 172.88876, "r_y2": 548.91264, "r_x3": 168.81696, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 168.81696, "t": 553.15465, "r": 172.88876, "b": 555.52309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.81696, "r_y0": 555.52309, "r_x1": 172.88876, "r_y1": 555.52309, "r_x2": 172.88876, "r_y2": 553.15465, "r_x3": 168.81696, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 147.30025, "t": 544.67065, "r": 149.70605, "b": 547.03909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 547.03909, "r_x1": 149.70605, "r_y1": 547.03909, "r_x2": 149.70605, "r_y2": 544.67065, "r_x3": 147.30025, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 150.90895, "t": 544.67065, "r": 155.72055, "b": 547.03909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 547.03909, "r_x1": 155.72055, "r_y1": 547.03909, "r_x2": 155.72055, "r_y2": 544.67065, "r_x3": 150.90895, "r_y3": 544.67065, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 147.30025, "t": 548.91264, "r": 149.70605, "b": 551.28108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 551.28108, "r_x1": 149.70605, "r_y1": 551.28108, "r_x2": 149.70605, "r_y2": 548.91264, "r_x3": 147.30025, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 150.90895, "t": 548.91264, "r": 155.72055, "b": 551.28108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 551.28108, "r_x1": 155.72055, "r_y1": 551.28108, "r_x2": 155.72055, "r_y2": 548.91264, "r_x3": 150.90895, "r_y3": 548.91264, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 147.30025, "t": 553.15465, "r": 149.70605, "b": 555.52309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.30025, "r_y0": 555.52309, "r_x1": 149.70605, "r_y1": 555.52309, "r_x2": 149.70605, "r_y2": 553.15465, "r_x3": 147.30025, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 150.90895, "t": 553.15465, "r": 155.72055, "b": 555.52309, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90895, "r_y0": 555.52309, "r_x1": 155.72055, "r_y1": 555.52309, "r_x2": 155.72055, "r_y2": 553.15465, "r_x3": 150.90895, "r_y3": 553.15465, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 152.05046, "t": 517.0098, "r": 171.24945, "b": 521.27298, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05046, "r_y0": 521.27298, "r_x1": 171.24945, "r_y1": 521.27298, "r_x2": 171.24945, "r_y2": 517.0098, "r_x3": 152.05046, "r_y3": 517.0098, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 148.13347, "t": 522.3122900000001, "r": 175.16759, "b": 526.57547, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13347, "r_y0": 526.57547, "r_x1": 175.16759, "r_y1": 526.57547, "r_x2": 175.16759, "r_y2": 522.3122900000001, "r_x3": 148.13347, "r_y3": 522.3122900000001, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 193.53331, "t": 524.51422, "r": 220.31973, "b": 528.7774, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53331, "r_y0": 528.7774, "r_x1": 220.31973, "r_y1": 528.7774, "r_x2": 220.31973, "r_y2": 524.51422, "r_x3": 193.53331, "r_y3": 524.51422, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 199.47311, "t": 529.8167100000001, "r": 214.37889, "b": 534.0799, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47311, "r_y0": 534.0799, "r_x1": 214.37889, "r_y1": 534.0799, "r_x2": 214.37889, "r_y2": 529.8167100000001, "r_x3": 199.47311, "r_y3": 529.8167100000001, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 273.61066, "t": 509.9053, "r": 284.47275, "b": 514.16849, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61066, "r_y0": 514.16849, "r_x1": 284.47275, "r_y1": 514.16849, "r_x2": 284.47275, "r_y2": 509.9053, "r_x3": 273.61066, "r_y3": 509.9053, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 270.45187, "t": 513.6928399999999, "r": 287.63242, "b": 517.9560200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 517.9560200000001, "r_x1": 287.63242, "r_y1": 517.9560200000001, "r_x2": 287.63242, "r_y2": 513.6928399999999, "r_x3": 270.45187, "r_y3": 513.6928399999999, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 332.47852, "t": 508.14438, "r": 348.14014, "b": 512.40756, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.47852, "r_y0": 512.40756, "r_x1": 348.14014, "r_y1": 512.40756, "r_x2": 348.14014, "r_y2": 508.14438, "r_x3": 332.47852, "r_y3": 508.14438, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 376.68622, "t": 521.12024, "r": 407.25497, "b": 525.38342, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.68622, "r_y0": 525.38342, "r_x1": 407.25497, "r_y1": 525.38342, "r_x2": 407.25497, "r_y2": 521.12024, "r_x3": 376.68622, "r_y3": 521.12024, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 373.90869, "t": 525.66525, "r": 410.03506, "b": 529.92844, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.90869, "r_y0": 529.92844, "r_x1": 410.03506, "r_y1": 529.92844, "r_x2": 410.03506, "r_y2": 525.66525, "r_x3": 373.90869, "r_y3": 525.66525, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 375.29871, "t": 530.21024, "r": 408.64902, "b": 534.47342, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.29871, "r_y0": 534.47342, "r_x1": 408.64902, "r_y1": 534.47342, "r_x2": 408.64902, "r_y2": 530.21024, "r_x3": 375.29871, "r_y3": 530.21024, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 377.06747, "t": 534.75522, "r": 406.88312, "b": 539.01843, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.06747, "r_y0": 539.01843, "r_x1": 406.88312, "r_y1": 539.01843, "r_x2": 406.88312, "r_y2": 534.75522, "r_x3": 377.06747, "r_y3": 534.75522, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 383.56683, "t": 563.24176, "r": 433.76544, "b": 567.50497, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.56683, "r_y0": 567.50497, "r_x1": 433.76544, "r_y1": 567.50497, "r_x2": 433.76544, "r_y2": 563.24176, "r_x3": 383.56683, "r_y3": 563.24176, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 383.52768, "t": 567.78676, "r": 433.80764999999997, "b": 572.04997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.52768, "r_y0": 572.04997, "r_x1": 433.80764999999997, "r_y1": 572.04997, "r_x2": 433.80764999999997, "r_y2": 567.78676, "r_x3": 383.52768, "r_y3": 567.78676, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 390.47522, "t": 572.33177, "r": 426.85703, "b": 576.59499, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.47522, "r_y0": 576.59499, "r_x1": 426.85703, "r_y1": 576.59499, "r_x2": 426.85703, "r_y2": 572.33177, "r_x3": 390.47522, "r_y3": 572.33177, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 293.94702, "t": 577.89143, "r": 323.1691, "b": 582.15465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 582.15465, "r_x1": 323.1691, "r_y1": 582.15465, "r_x2": 323.1691, "r_y2": 577.89143, "r_x3": 293.94702, "r_y3": 577.89143, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 293.94702, "t": 582.43648, "r": 324.59396, "b": 586.69969, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.94702, "r_y0": 586.69969, "r_x1": 324.59396, "r_y1": 586.69969, "r_x2": 324.59396, "r_y2": 582.43648, "r_x3": 293.94702, "r_y3": 582.43648, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 333.07819, "t": 541.82269, "r": 364.14691, "b": 546.08591, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 546.08591, "r_x1": 364.14691, "r_y1": 546.08591, "r_x2": 364.14691, "r_y2": 541.82269, "r_x3": 333.07819, "r_y3": 541.82269, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 333.07819, "t": 545.6102, "r": 369.71542, "b": 549.87341, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.07819, "r_y0": 549.87341, "r_x1": 369.71542, "r_y1": 549.87341, "r_x2": 369.71542, "r_y2": 545.6102, "r_x3": 333.07819, "r_y3": 545.6102, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 232.65881000000002, "t": 515.24139, "r": 249.58894000000004, "b": 519.50458, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.65881000000002, "r_y0": 519.50458, "r_x1": 249.58894000000004, "r_y1": 519.50458, "r_x2": 249.58894000000004, "r_y2": 515.24139, "r_x3": 232.65881000000002, "r_y3": 515.24139, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 269.8219, "t": 545.97102, "r": 288.26279, "b": 550.23424, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8219, "r_y0": 550.23424, "r_x1": 288.26279, "r_y1": 550.23424, "r_x2": 288.26279, "r_y2": 545.97102, "r_x3": 269.8219, "r_y3": 545.97102, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 270.45187, "t": 549.75851, "r": 287.63242, "b": 554.0217299999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45187, "r_y0": 554.0217299999999, "r_x1": 287.63242, "r_y1": 554.0217299999999, "r_x2": 287.63242, "r_y2": 549.75851, "r_x3": 270.45187, "r_y3": 549.75851, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 332.17676, "t": 515.91205, "r": 358.11206, "b": 520.17523, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 520.17523, "r_x1": 358.11206, "r_y1": 520.17523, "r_x2": 358.11206, "r_y2": 515.91205, "r_x3": 332.17676, "r_y3": 515.91205, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 332.17676, "t": 521.9720500000001, "r": 361.58298, "b": 526.23523, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 526.23523, "r_x1": 361.58298, "r_y1": 526.23523, "r_x2": 361.58298, "r_y2": 521.9720500000001, "r_x3": 332.17676, "r_y3": 521.9720500000001, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 332.17676, "t": 528.03204, "r": 364.76474, "b": 532.29523, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 532.29523, "r_x1": 364.76474, "r_y1": 532.29523, "r_x2": 364.76474, "r_y2": 528.03204, "r_x3": 332.17676, "r_y3": 528.03204, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 332.17676, "t": 534.09204, "r": 335.96548, "b": 538.35524, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.17676, "r_y0": 538.35524, "r_x1": 335.96548, "r_y1": 538.35524, "r_x2": 335.96548, "r_y2": 534.09204, "r_x3": 332.17676, "r_y3": 534.09204, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.8894, "t": 516.39508, "r": 329.41641, "b": 520.6582599999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8894, "r_y0": 520.6582599999999, "r_x1": 329.41641, "r_y1": 520.6582599999999, "r_x2": 329.41641, "r_y2": 516.39508, "r_x3": 326.8894, "r_y3": 516.39508, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 327.04089, "t": 522.4247700000001, "r": 329.5679, "b": 526.68796, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 526.68796, "r_x1": 329.5679, "r_y1": 526.68796, "r_x2": 329.5679, "r_y2": 522.4247700000001, "r_x3": 327.04089, "r_y3": 522.4247700000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 327.04089, "t": 528.51508, "r": 329.5679, "b": 532.77826, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04089, "r_y0": 532.77826, "r_x1": 329.5679, "r_y1": 532.77826, "r_x2": 329.5679, "r_y2": 528.51508, "r_x3": 327.04089, "r_y3": 528.51508, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 424.14102, "t": 527.4428399999999, "r": 426.66803, "b": 531.7060200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14102, "r_y0": 531.7060200000001, "r_x1": 426.66803, "r_y1": 531.7060200000001, "r_x2": 426.66803, "r_y2": 527.4428399999999, "r_x3": 424.14102, "r_y3": 527.4428399999999, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 453.0018, "t": 517.4539500000001, "r": 455.52881, "b": 521.71713, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0018, "r_y0": 521.71713, "r_x1": 455.52881, "r_y1": 521.71713, "r_x2": 455.52881, "r_y2": 517.4539500000001, "r_x3": 453.0018, "r_y3": 517.4539500000001, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 423.85825, "t": 517.06281, "r": 426.38525, "b": 521.32599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.85825, "r_y0": 521.32599, "r_x1": 426.38525, "r_y1": 521.32599, "r_x2": 426.38525, "r_y2": 517.06281, "r_x3": 423.85825, "r_y3": 517.06281, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 333.4342, "t": 557.36679, "r": 337.27542, "b": 562.35719, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4342, "r_y0": 562.35719, "r_x1": 337.27542, "r_y1": 562.35719, "r_x2": 337.27542, "r_y2": 557.36679, "r_x3": 333.4342, "r_y3": 557.36679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 340.35397, "t": 557.31679, "r": 344.19519, "b": 562.30719, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35397, "r_y0": 562.30719, "r_x1": 344.19519, "r_y1": 562.30719, "r_x2": 344.19519, "r_y2": 557.31679, "r_x3": 340.35397, "r_y3": 557.31679, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 340.30978, "t": 563.8653899999999, "r": 344.151, "b": 568.8557900000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.30978, "r_y0": 568.8557900000001, "r_x1": 344.151, "r_y1": 568.8557900000001, "r_x2": 344.151, "r_y2": 563.8653899999999, "r_x3": 340.30978, "r_y3": 563.8653899999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 346.79904, "t": 563.8686700000001, "r": 350.64026, "b": 568.85907, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.79904, "r_y0": 568.85907, "r_x1": 350.64026, "r_y1": 568.85907, "r_x2": 350.64026, "r_y2": 563.8686700000001, "r_x3": 346.79904, "r_y3": 563.8686700000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 333.59583, "t": 563.82271, "r": 337.43704, "b": 568.81311, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.59583, "r_y0": 568.81311, "r_x1": 337.43704, "r_y1": 568.81311, "r_x2": 337.43704, "r_y2": 563.82271, "r_x3": 333.59583, "r_y3": 563.82271, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 340.37543, "t": 570.42673, "r": 344.21664, "b": 575.41713, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37543, "r_y0": 575.41713, "r_x1": 344.21664, "r_y1": 575.41713, "r_x2": 344.21664, "r_y2": 570.42673, "r_x3": 340.37543, "r_y3": 570.42673, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 346.86469, "t": 570.43001, "r": 350.7059, "b": 575.42041, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86469, "r_y0": 575.42041, "r_x1": 350.7059, "r_y1": 575.42041, "r_x2": 350.7059, "r_y2": 570.43001, "r_x3": 346.86469, "r_y3": 570.43001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 333.66144, "t": 570.38405, "r": 337.50266, "b": 575.37445, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66144, "r_y0": 575.37445, "r_x1": 337.50266, "r_y1": 575.37445, "r_x2": 337.50266, "r_y2": 570.38405, "r_x3": 333.66144, "r_y3": 570.38405, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 340.37671, "t": 577.02606, "r": 344.21793, "b": 582.0164599999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.37671, "r_y0": 582.0164599999999, "r_x1": 344.21793, "r_y1": 582.0164599999999, "r_x2": 344.21793, "r_y2": 577.02606, "r_x3": 340.37671, "r_y3": 577.02606, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 346.86597, "t": 577.02934, "r": 350.70718, "b": 582.01974, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86597, "r_y0": 582.01974, "r_x1": 350.70718, "r_y1": 582.01974, "r_x2": 350.70718, "r_y2": 577.02934, "r_x3": 346.86597, "r_y3": 577.02934, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 333.66272, "t": 576.98338, "r": 337.50394, "b": 581.97379, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66272, "r_y0": 581.97379, "r_x1": 337.50394, "r_y1": 581.97379, "r_x2": 337.50394, "r_y2": 576.98338, "r_x3": 333.66272, "r_y3": 576.98338, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 340.27948, "t": 583.39737, "r": 344.1207, "b": 588.38777, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.27948, "r_y0": 588.38777, "r_x1": 344.1207, "r_y1": 588.38777, "r_x2": 344.1207, "r_y2": 583.39737, "r_x3": 340.27948, "r_y3": 583.39737, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 346.76874, "t": 583.40068, "r": 350.60995, "b": 588.39108, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.76874, "r_y0": 588.39108, "r_x1": 350.60995, "r_y1": 588.39108, "r_x2": 350.60995, "r_y2": 583.40068, "r_x3": 346.76874, "r_y3": 583.40068, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 333.56549, "t": 583.35474, "r": 337.40671, "b": 588.34514, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.56549, "r_y0": 588.34514, "r_x1": 337.40671, "r_y1": 588.34514, "r_x2": 337.40671, "r_y2": 583.35474, "r_x3": 333.56549, "r_y3": 583.35474, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 353.03326, "t": 556.8831299999999, "r": 359.83362, "b": 561.87354, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03326, "r_y0": 561.87354, "r_x1": 359.83362, "r_y1": 561.87354, "r_x2": 359.83362, "r_y2": 556.8831299999999, "r_x3": 353.03326, "r_y3": 556.8831299999999, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 353.18604, "t": 563.58044, "r": 359.98639, "b": 568.57085, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.18604, "r_y0": 568.57085, "r_x1": 359.98639, "r_y1": 568.57085, "r_x2": 359.98639, "r_y2": 563.58044, "r_x3": 353.18604, "r_y3": 563.58044, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 353.19864, "t": 570.1623500000001, "r": 359.99899, "b": 575.15276, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19864, "r_y0": 575.15276, "r_x1": 359.99899, "r_y1": 575.15276, "r_x2": 359.99899, "r_y2": 570.1623500000001, "r_x3": 353.19864, "r_y3": 570.1623500000001, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 353.1532, "t": 576.76611, "r": 359.95355, "b": 581.75652, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.1532, "r_y0": 581.75652, "r_x1": 359.95355, "r_y1": 581.75652, "r_x2": 359.95355, "r_y2": 576.76611, "r_x3": 353.1532, "r_y3": 576.76611, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 353.26935, "t": 583.40628, "r": 360.0697, "b": 588.3966800000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.26935, "r_y0": 588.3966800000001, "r_x1": 360.0697, "r_y1": 588.3966800000001, "r_x2": 360.0697, "r_y2": 583.40628, "r_x3": 353.26935, "r_y3": 583.40628, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 347.37979, "t": 557.08235, "r": 350.33786, "b": 562.07275, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.37979, "r_y0": 562.07275, "r_x1": 350.33786, "r_y1": 562.07275, "r_x2": 350.33786, "r_y2": 557.08235, "r_x3": 347.37979, "r_y3": 557.08235, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 331.14026, "t": 564.2907700000001, "r": 333.66727, "b": 568.55399, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14026, "r_y0": 568.55399, "r_x1": 333.66727, "r_y1": 568.55399, "r_x2": 333.66727, "r_y2": 564.2907700000001, "r_x3": 331.14026, "r_y3": 564.2907700000001, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 340.80972, "t": 554.59312, "r": 343.33673, "b": 558.85634, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.80972, "r_y0": 558.85634, "r_x1": 343.33673, "r_y1": 558.85634, "r_x2": 343.33673, "r_y2": 554.59312, "r_x3": 340.80972, "r_y3": 554.59312, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 330.97992, "t": 554.83035, "r": 333.50693, "b": 559.09357, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.97992, "r_y0": 559.09357, "r_x1": 333.50693, "r_y1": 559.09357, "r_x2": 333.50693, "r_y2": 554.83035, "r_x3": 330.97992, "r_y3": 554.83035, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 4, "page_no": 7, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.765, "t": 620.19278, "r": 480.5917400000001, "b": 664.8547599999999, "coord_origin": "TOPLEFT" }, "confidence": 0.951270341873169, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 628.98975, "r_x1": 480.58792, "r_y1": 628.98975, "r_x2": 480.58792, "r_y2": 620.19278, "r_x3": 149.709, "r_y3": 620.19278, "coord_origin": "TOPLEFT" }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 640.94475, "r_x1": 480.58871, "r_y1": 640.94475, "r_x2": 480.58871, "r_y2": 632.14778, "r_x3": 134.765, "r_y3": 632.14778, "coord_origin": "TOPLEFT" }, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 652.89975, "r_x1": 480.5917400000001, "r_y1": 652.89975, "r_x2": 480.5917400000001, "r_y2": 644.1027799999999, "r_x3": 134.765, "r_y3": 644.1027799999999, "coord_origin": "TOPLEFT" }, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 664.8547599999999, "r_x1": 480.58968999999996, "r_y1": 664.8547599999999, "r_x2": 480.58968999999996, "r_y2": 656.0577900000001, "r_x3": 134.765, "r_y3": 656.0577900000001, "coord_origin": "TOPLEFT" }, "text": "cells. The predicted OTSL structures were converted back to HTML format in", "orig": "cells. The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for table structure prediction, and Mean Average Precision (mAP) with 0.75 Intersection Over Union (IOU) threshold for the bounding-box predictions of table cells. The predicted OTSL structures were converted back to HTML format in" } ], "headers": [ { "label": "page_header", "id": 9, "page_no": 7, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 139.37193, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8301323056221008, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 139.37193, "r_y1": 101.84069999999997, "r_x2": 139.37193, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8" }, { "label": "page_header", "id": 8, "page_no": 7, "cluster": { "id": 8, "label": "page_header", "bbox": { "l": 167.81335, "t": 93.77099999999996, "r": 231.72227, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8631826043128967, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81335, "r_y0": 101.84069999999997, "r_x1": 178.07675, "r_y1": 101.84069999999997, "r_x2": 178.07675, "r_y2": 93.77099999999996, "r_x3": 167.81335, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37415, "r_y0": 101.84069999999997, "r_x1": 231.72227, "r_y1": 101.84069999999997, "r_x2": 231.72227, "r_y2": 93.77099999999996, "r_x3": 182.37415, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 8, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.5936899999999, "r_y1": 127.73077, "r_x2": 480.5936899999999, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 480.59579, "r_y1": 139.68579, "r_x2": 480.59579, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 151.64178000000004, "r_x1": 210.78462, "r_y1": 151.64178000000004, "r_x2": 210.78462, "r_y2": 142.84479, "r_x3": 134.765, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 177.9928, "r_x1": 149.40205, "r_y1": 177.9928, "r_x2": 149.40205, "r_y2": 169.18584999999996, "r_x3": 134.765, "r_y3": 169.18584999999996, "coord_origin": "TOPLEFT" }, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 177.9928, "r_x1": 318.44843, "r_y1": 177.9928, "r_x2": 318.44843, "r_y2": 169.18584999999996, "r_x3": 160.85904, "r_y3": 169.18584999999996, "coord_origin": "TOPLEFT" }, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 194.38280999999995, "r_x1": 480.59183, "r_y1": 194.38280999999995, "r_x2": 480.59183, "r_y2": 185.58582, "r_x3": 134.765, "r_y3": 185.58582, "coord_origin": "TOPLEFT" }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 206.33783000000005, "r_x1": 480.59183, "r_y1": 206.33783000000005, "r_x2": 480.59183, "r_y2": 197.54083000000003, "r_x3": 134.765, "r_y3": 197.54083000000003, "coord_origin": "TOPLEFT" }, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 218.29285000000004, "r_x1": 480.59177000000005, "r_y1": 218.29285000000004, "r_x2": 480.59177000000005, "r_y2": 209.49585000000002, "r_x3": 134.765, "r_y3": 209.49585000000002, "coord_origin": "TOPLEFT" }, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 230.24785999999995, "r_x1": 480.59277, "r_y1": 230.24785999999995, "r_x2": 480.59277, "r_y2": 221.45087, "r_x3": 134.765, "r_y3": 221.45087, "coord_origin": "TOPLEFT" }, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 242.20288000000005, "r_x1": 440.94159, "r_y1": 242.20288000000005, "r_x2": 440.94159, "r_y2": 233.40588000000002, "r_x3": 134.765, "r_y3": 233.40588000000002, "coord_origin": "TOPLEFT" }, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.86798, "r_y0": 242.20288000000005, "r_x1": 480.58786000000003, "r_y1": 242.20288000000005, "r_x2": 480.58786000000003, "r_y2": 233.40588000000002, "r_x3": 444.86798, "r_y3": 233.40588000000002, "coord_origin": "TOPLEFT" }, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 254.15886999999998, "r_x1": 145.20081, "r_y1": 254.15886999999998, "r_x2": 145.20081, "r_y2": 245.36188000000004, "r_x3": 134.76498, "r_y3": 245.36188000000004, "coord_origin": "TOPLEFT" }, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.14899, "r_y0": 254.15886999999998, "r_x1": 311.21957, "r_y1": 254.15886999999998, "r_x2": 311.21957, "r_y2": 245.36188000000004, "r_x3": 149.14899, "r_y3": 245.36188000000004, "coord_origin": "TOPLEFT" }, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 282.9986, "r_x1": 160.11836, "r_y1": 282.9986, "r_x2": 160.11836, "r_y2": 275.07232999999997, "r_x3": 134.76498, "r_y3": 275.07232999999997, "coord_origin": "TOPLEFT" }, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.34528, "r_y0": 282.9986, "r_x1": 175.59526, "r_y1": 282.9986, "r_x2": 175.59526, "r_y2": 275.07232999999997, "r_x3": 167.34528, "r_y3": 275.07232999999997, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.13298, "r_y0": 283.2048300000001, "r_x1": 480.59365999999994, "r_y1": 283.2048300000001, "r_x2": 480.59365999999994, "r_y2": 275.13507000000004, "r_x3": 188.13298, "r_y3": 275.13507000000004, "coord_origin": "TOPLEFT" }, "text": "HPO performed in OTSL and HTML representation on the same", "orig": "HPO performed in OTSL and HTML representation on the same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 294.16385, "r_x1": 480.59444999999994, "r_y1": 294.16385, "r_x2": 480.59444999999994, "r_y2": 286.09409, "r_x3": 134.76498, "r_y3": 286.09409, "coord_origin": "TOPLEFT" }, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 305.12283, "r_x1": 480.5954, "r_y1": 305.12283, "r_x2": 480.5954, "r_y2": 297.05307, "r_x3": 134.76498, "r_y3": 297.05307, "coord_origin": "TOPLEFT" }, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 316.08182, "r_x1": 480.59451, "r_y1": 316.08182, "r_x2": 480.59451, "r_y2": 308.01205, "r_x3": 134.76498, "r_y3": 308.01205, "coord_origin": "TOPLEFT" }, "text": "smaller models trained on OTSL perform better, especially in recognizing complex", "orig": "smaller models trained on OTSL perform better, especially in recognizing complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 327.0408, "r_x1": 480.59441999999996, "r_y1": 327.0408, "r_x2": 480.59441999999996, "r_y2": 318.97104, "r_x3": 134.76498, "r_y3": 318.97104, "coord_origin": "TOPLEFT" }, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8047199999999, "r_x1": 168.04793, "r_y1": 349.8047199999999, "r_x2": 168.04793, "r_y2": 341.73495, "r_x3": 160.37, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.592, "r_y0": 362.75570999999997, "r_x1": 183.82806, "r_y1": 362.75570999999997, "r_x2": 183.82806, "r_y2": 354.68594, "r_x3": 144.592, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.974, "r_y0": 349.8047199999999, "r_x1": 215.65193, "r_y1": 349.8047199999999, "r_x2": 215.65193, "r_y2": 341.73495, "r_x3": 207.974, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19499, "r_y0": 362.75570999999997, "r_x1": 231.43106, "r_y1": 362.75570999999997, "r_x2": 231.43106, "r_y2": 354.68594, "r_x3": 192.19499, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.79799999999997, "r_y0": 355.28372, "r_x1": 278.31766, "r_y1": 355.28372, "r_x2": 278.31766, "r_y2": 347.21396, "r_x3": 239.79799999999997, "r_y3": 347.21396, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67001, "r_y0": 349.8047199999999, "r_x1": 348.26419, "r_y1": 349.8047199999999, "r_x2": 348.26419, "r_y2": 341.73495, "r_x3": 324.67001, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.271, "r_y0": 349.8047199999999, "r_x1": 417.12683, "r_y1": 349.8047199999999, "r_x2": 417.12683, "r_y2": 341.73495, "r_x3": 396.271, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.927, "r_y0": 360.7637, "r_x1": 418.47278, "r_y1": 360.7637, "r_x2": 418.47278, "r_y2": 352.69394000000005, "r_x3": 394.927, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.771, "r_y0": 349.8047199999999, "r_x1": 467.1423, "r_y1": 349.8047199999999, "r_x2": 467.1423, "r_y2": 341.73495, "r_x3": 430.771, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.14801, "r_y0": 360.7637, "r_x1": 470.76056, "r_y1": 360.7637, "r_x2": 470.76056, "r_y2": 352.69394000000005, "r_x3": 427.14801, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.686, "r_y0": 362.75570999999997, "r_x1": 312.33261, "r_y1": 362.75570999999997, "r_x2": 312.33261, "r_y2": 354.68594, "r_x3": 286.686, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.702, "r_y0": 362.75570999999997, "r_x1": 353.71988, "r_y1": 362.75570999999997, "r_x2": 353.71988, "r_y2": 354.68594, "r_x3": 320.702, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.306, "r_y0": 362.75570999999997, "r_x1": 379.03094, "r_y1": 362.75570999999997, "r_x2": 379.03094, "r_y2": 354.68594, "r_x3": 369.306, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 381.58572, "r_x1": 166.51294, "r_y1": 381.58572, "r_x2": 166.51294, "r_y2": 373.51596, "r_x3": 161.90601, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 381.58572, "r_x1": 214.11594, "r_y1": 381.58572, "r_x2": 214.11594, "r_y2": 373.51596, "r_x3": 209.509, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 376.10571, "r_x1": 271.40527, "r_y1": 376.10571, "r_x2": 271.40527, "r_y2": 368.03595, "r_x3": 246.71000999999998, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 376.10571, "r_x1": 310.00375, "r_y1": 376.10571, "r_x2": 310.00375, "r_y2": 368.03595, "r_x3": 289.017, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 376.10571, "r_x1": 347.70377, "r_y1": 376.10571, "r_x2": 347.70377, "r_y2": 368.03595, "r_x3": 326.71701, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 376.10571, "r_x1": 384.66275, "r_y1": 376.10571, "r_x2": 384.66275, "r_y2": 368.03595, "r_x3": 363.67599, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.26999, "r_y0": 375.89948, "r_x1": 416.12723, "r_y1": 375.89948, "r_x2": 416.12723, "r_y2": 367.97317999999996, "r_x3": 397.26999, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 375.89948, "r_x1": 458.38425, "r_y1": 375.89948, "r_x2": 458.38425, "r_y2": 367.97317999999996, "r_x3": 439.52701, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 389.05771, "r_x1": 272.93954, "r_y1": 389.05771, "r_x2": 272.93954, "r_y2": 380.98795, "r_x3": 245.17598999999998, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 389.05771, "r_x1": 310.00375, "r_y1": 389.05771, "r_x2": 310.00375, "r_y2": 380.98795, "r_x3": 289.017, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 389.05771, "r_x1": 347.70377, "r_y1": 389.05771, "r_x2": 347.70377, "r_y2": 380.98795, "r_x3": 326.71701, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 389.05771, "r_x1": 384.66275, "r_y1": 389.05771, "r_x2": 384.66275, "r_y2": 380.98795, "r_x3": 363.67599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 389.05771, "r_x1": 417.19275, "r_y1": 389.05771, "r_x2": 417.19275, "r_y2": 380.98795, "r_x3": 396.20599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 389.05771, "r_x1": 457.14682, "r_y1": 389.05771, "r_x2": 457.14682, "r_y2": 380.98795, "r_x3": 440.767, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 407.88672, "r_x1": 166.51294, "r_y1": 407.88672, "r_x2": 166.51294, "r_y2": 399.81696, "r_x3": 161.90601, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 407.88672, "r_x1": 214.11594, "r_y1": 407.88672, "r_x2": 214.11594, "r_y2": 399.81696, "r_x3": 209.509, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 402.40771, "r_x1": 271.40527, "r_y1": 402.40771, "r_x2": 271.40527, "r_y2": 394.33795, "r_x3": 246.71000999999998, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 402.40771, "r_x1": 310.00375, "r_y1": 402.40771, "r_x2": 310.00375, "r_y2": 394.33795, "r_x3": 289.017, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 402.40771, "r_x1": 347.70377, "r_y1": 402.40771, "r_x2": 347.70377, "r_y2": 394.33795, "r_x3": 326.71701, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 402.40771, "r_x1": 384.66275, "r_y1": 402.40771, "r_x2": 384.66275, "r_y2": 394.33795, "r_x3": 363.67599, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 402.20148, "r_x1": 418.77887, "r_y1": 402.20148, "r_x2": 418.77887, "r_y2": 394.27518, "r_x3": 394.61801, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 402.20148, "r_x1": 458.38425, "r_y1": 402.20148, "r_x2": 458.38425, "r_y2": 394.27518, "r_x3": 439.52701, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 415.3587, "r_x1": 272.93954, "r_y1": 415.3587, "r_x2": 272.93954, "r_y2": 407.28894, "r_x3": 245.17598999999998, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 415.3587, "r_x1": 310.00375, "r_y1": 415.3587, "r_x2": 310.00375, "r_y2": 407.28894, "r_x3": 289.017, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 415.3587, "r_x1": 347.70377, "r_y1": 415.3587, "r_x2": 347.70377, "r_y2": 407.28894, "r_x3": 326.71701, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 415.15247, "r_x1": 386.24887, "r_y1": 415.15247, "r_x2": 386.24887, "r_y2": 407.22617, "r_x3": 362.08801, "r_y3": 407.22617, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 415.3587, "r_x1": 417.19275, "r_y1": 415.3587, "r_x2": 417.19275, "r_y2": 407.28894, "r_x3": 396.20599, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 415.3587, "r_x1": 457.14682, "r_y1": 415.3587, "r_x2": 457.14682, "r_y2": 407.28894, "r_x3": 440.767, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 434.1877099999999, "r_x1": 166.51294, "r_y1": 434.1877099999999, "r_x2": 166.51294, "r_y2": 426.11795, "r_x3": 161.90601, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 434.1877099999999, "r_x1": 214.11594, "r_y1": 434.1877099999999, "r_x2": 214.11594, "r_y2": 426.11795, "r_x3": 209.509, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 428.70871, "r_x1": 271.40527, "r_y1": 428.70871, "r_x2": 271.40527, "r_y2": 420.63895, "r_x3": 246.71000999999998, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 428.70871, "r_x1": 310.00375, "r_y1": 428.70871, "r_x2": 310.00375, "r_y2": 420.63895, "r_x3": 289.017, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 428.70871, "r_x1": 347.70377, "r_y1": 428.70871, "r_x2": 347.70377, "r_y2": 420.63895, "r_x3": 326.71701, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 428.70871, "r_x1": 384.66275, "r_y1": 428.70871, "r_x2": 384.66275, "r_y2": 420.63895, "r_x3": 363.67599, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 428.50247, "r_x1": 418.77887, "r_y1": 428.50247, "r_x2": 418.77887, "r_y2": 420.57617, "r_x3": 394.61801, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 428.50247, "r_x1": 458.38425, "r_y1": 428.50247, "r_x2": 458.38425, "r_y2": 420.57617, "r_x3": 439.52701, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 441.6597, "r_x1": 272.93954, "r_y1": 441.6597, "r_x2": 272.93954, "r_y2": 433.58994, "r_x3": 245.17598999999998, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 441.6597, "r_x1": 310.00375, "r_y1": 441.6597, "r_x2": 310.00375, "r_y2": 433.58994, "r_x3": 289.017, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 441.6597, "r_x1": 347.70377, "r_y1": 441.6597, "r_x2": 347.70377, "r_y2": 433.58994, "r_x3": 326.71701, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 441.45346, "r_x1": 386.24887, "r_y1": 441.45346, "r_x2": 386.24887, "r_y2": 433.5271599999999, "r_x3": 362.08801, "r_y3": 433.5271599999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 441.6597, "r_x1": 417.19275, "r_y1": 441.6597, "r_x2": 417.19275, "r_y2": 433.58994, "r_x3": 396.20599, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 441.6597, "r_x1": 457.14682, "r_y1": 441.6597, "r_x2": 457.14682, "r_y2": 433.58994, "r_x3": 440.767, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 460.48972, "r_x1": 166.51294, "r_y1": 460.48972, "r_x2": 166.51294, "r_y2": 452.41995, "r_x3": 161.90601, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 460.48972, "r_x1": 214.11594, "r_y1": 460.48972, "r_x2": 214.11594, "r_y2": 452.41995, "r_x3": 209.509, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 455.0097, "r_x1": 271.40527, "r_y1": 455.0097, "r_x2": 271.40527, "r_y2": 446.9399399999999, "r_x3": 246.71000999999998, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 455.0097, "r_x1": 310.00375, "r_y1": 455.0097, "r_x2": 310.00375, "r_y2": 446.9399399999999, "r_x3": 289.017, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.021, "r_y0": 455.0097, "r_x1": 345.40082, "r_y1": 455.0097, "r_x2": 345.40082, "r_y2": 446.9399399999999, "r_x3": 329.021, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 454.80347, "r_x1": 386.24887, "r_y1": 454.80347, "r_x2": 386.24887, "r_y2": 446.87717, "r_x3": 362.08801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 454.80347, "r_x1": 418.77887, "r_y1": 454.80347, "r_x2": 418.77887, "r_y2": 446.87717, "r_x3": 394.61801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 454.80347, "r_x1": 458.38425, "r_y1": 454.80347, "r_x2": 458.38425, "r_y2": 446.87717, "r_x3": 439.52701, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 467.9617, "r_x1": 272.93954, "r_y1": 467.9617, "r_x2": 272.93954, "r_y2": 459.8919399999999, "r_x3": 245.17598999999998, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 467.9617, "r_x1": 310.00375, "r_y1": 467.9617, "r_x2": 310.00375, "r_y2": 459.8919399999999, "r_x3": 289.017, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 467.9617, "r_x1": 347.70377, "r_y1": 467.9617, "r_x2": 347.70377, "r_y2": 459.8919399999999, "r_x3": 326.71701, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 467.9617, "r_x1": 384.66275, "r_y1": 467.9617, "r_x2": 384.66275, "r_y2": 459.8919399999999, "r_x3": 363.67599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 467.9617, "r_x1": 417.19275, "r_y1": 467.9617, "r_x2": 417.19275, "r_y2": 459.8919399999999, "r_x3": 396.20599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65302, "r_y0": 467.9617, "r_x1": 451.25995, "r_y1": 467.9617, "r_x2": 451.25995, "r_y2": 459.8919399999999, "r_x3": 446.65302, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 516.95874, "r_x1": 149.40205, "r_y1": 516.95874, "r_x2": 149.40205, "r_y2": 508.15179, "r_x3": 134.765, "r_y3": 508.15179, "coord_origin": "TOPLEFT" }, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 516.95874, "r_x1": 264.40332, "r_y1": 516.95874, "r_x2": 264.40332, "r_y2": 508.15179, "r_x3": 160.85904, "r_y3": 508.15179, "coord_origin": "TOPLEFT" }, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 533.34775, "r_x1": 480.59075999999993, "r_y1": 533.34775, "r_x2": 480.59075999999993, "r_y2": 524.55078, "r_x3": 134.765, "r_y3": 524.55078, "coord_origin": "TOPLEFT" }, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 545.3037400000001, "r_x1": 480.58675999999997, "r_y1": 545.3037400000001, "r_x2": 480.58675999999997, "r_y2": 536.50677, "r_x3": 134.765, "r_y3": 536.50677, "coord_origin": "TOPLEFT" }, "text": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 557.25874, "r_x1": 480.59572999999995, "r_y1": 557.25874, "r_x2": 480.59572999999995, "r_y2": 548.4617800000001, "r_x3": 134.765, "r_y3": 548.4617800000001, "coord_origin": "TOPLEFT" }, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 569.21375, "r_x1": 480.59177000000005, "r_y1": 569.21375, "r_x2": 480.59177000000005, "r_y2": 560.41678, "r_x3": 134.765, "r_y3": 560.41678, "coord_origin": "TOPLEFT" }, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 581.16875, "r_x1": 480.59069999999997, "r_y1": 581.16875, "r_x2": 480.59069999999997, "r_y2": 572.37178, "r_x3": 134.765, "r_y3": 572.37178, "coord_origin": "TOPLEFT" }, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 593.12375, "r_x1": 480.5957599999999, "r_y1": 593.12375, "r_x2": 480.5957599999999, "r_y2": 584.32678, "r_x3": 134.765, "r_y3": 584.32678, "coord_origin": "TOPLEFT" }, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 605.07974, "r_x1": 480.58774, "r_y1": 605.07974, "r_x2": 480.58774, "r_y2": 596.28278, "r_x3": 134.765, "r_y3": 596.28278, "coord_origin": "TOPLEFT" }, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 617.03474, "r_x1": 206.78664, "r_y1": 617.03474, "r_x2": 206.78664, "r_y2": 608.2377799999999, "r_x3": 134.765, "r_y3": 608.2377799999999, "coord_origin": "TOPLEFT" }, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 628.98975, "r_x1": 480.59271, "r_y1": 628.98975, "r_x2": 480.59271, "r_y2": 620.19278, "r_x3": 149.709, "r_y3": 620.19278, "coord_origin": "TOPLEFT" }, "text": "Additionally, the results show that OTSL has an advantage over HTML", "orig": "Additionally, the results show that OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 640.94475, "r_x1": 480.5957599999999, "r_y1": 640.94475, "r_x2": 480.5957599999999, "r_y2": 632.14778, "r_x3": 134.765, "r_y3": 632.14778, "coord_origin": "TOPLEFT" }, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 652.89975, "r_x1": 480.59283000000005, "r_y1": 652.89975, "r_x2": 480.59283000000005, "r_y2": 644.1027799999999, "r_x3": 134.765, "r_y3": 644.1027799999999, "coord_origin": "TOPLEFT" }, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 664.8547599999999, "r_x1": 405.79651, "r_y1": 664.8547599999999, "r_x2": 405.79651, "r_y2": 656.0577900000001, "r_x3": 134.765, "r_y3": 656.0577900000001, "coord_origin": "TOPLEFT" }, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 8, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9373378753662109, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "page_header", "bbox": { "l": 475.98431, "t": 93.77099999999996, "r": 480.59125000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8857625722885132, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.59579, "b": 151.64178000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9805440306663513, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.5936899999999, "r_y1": 127.73077, "r_x2": 480.5936899999999, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 480.59579, "r_y1": 139.68579, "r_x2": 480.59579, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 151.64178000000004, "r_x1": 210.78462, "r_y1": 151.64178000000004, "r_x2": 210.78462, "r_y2": 142.84479, "r_x3": 134.765, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "section_header", "bbox": { "l": 134.765, "t": 169.18584999999996, "r": 318.44843, "b": 177.9928, "coord_origin": "TOPLEFT" }, "confidence": 0.9579681158065796, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 177.9928, "r_x1": 149.40205, "r_y1": 177.9928, "r_x2": 149.40205, "r_y2": 169.18584999999996, "r_x3": 134.765, "r_y3": 169.18584999999996, "coord_origin": "TOPLEFT" }, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 177.9928, "r_x1": 318.44843, "r_y1": 177.9928, "r_x2": 318.44843, "r_y2": 169.18584999999996, "r_x3": 160.85904, "r_y3": 169.18584999999996, "coord_origin": "TOPLEFT" }, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 134.76498, "t": 185.58582, "r": 480.59277, "b": 254.15886999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.9842326641082764, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 194.38280999999995, "r_x1": 480.59183, "r_y1": 194.38280999999995, "r_x2": 480.59183, "r_y2": 185.58582, "r_x3": 134.765, "r_y3": 185.58582, "coord_origin": "TOPLEFT" }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 206.33783000000005, "r_x1": 480.59183, "r_y1": 206.33783000000005, "r_x2": 480.59183, "r_y2": 197.54083000000003, "r_x3": 134.765, "r_y3": 197.54083000000003, "coord_origin": "TOPLEFT" }, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 218.29285000000004, "r_x1": 480.59177000000005, "r_y1": 218.29285000000004, "r_x2": 480.59177000000005, "r_y2": 209.49585000000002, "r_x3": 134.765, "r_y3": 209.49585000000002, "coord_origin": "TOPLEFT" }, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 230.24785999999995, "r_x1": 480.59277, "r_y1": 230.24785999999995, "r_x2": 480.59277, "r_y2": 221.45087, "r_x3": 134.765, "r_y3": 221.45087, "coord_origin": "TOPLEFT" }, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 242.20288000000005, "r_x1": 440.94159, "r_y1": 242.20288000000005, "r_x2": 440.94159, "r_y2": 233.40588000000002, "r_x3": 134.765, "r_y3": 233.40588000000002, "coord_origin": "TOPLEFT" }, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.86798, "r_y0": 242.20288000000005, "r_x1": 480.58786000000003, "r_y1": 242.20288000000005, "r_x2": 480.58786000000003, "r_y2": 233.40588000000002, "r_x3": 444.86798, "r_y3": 233.40588000000002, "coord_origin": "TOPLEFT" }, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 254.15886999999998, "r_x1": 145.20081, "r_y1": 254.15886999999998, "r_x2": 145.20081, "r_y2": 245.36188000000004, "r_x3": 134.76498, "r_y3": 245.36188000000004, "coord_origin": "TOPLEFT" }, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.14899, "r_y0": 254.15886999999998, "r_x1": 311.21957, "r_y1": 254.15886999999998, "r_x2": 311.21957, "r_y2": 245.36188000000004, "r_x3": 149.14899, "r_y3": 245.36188000000004, "coord_origin": "TOPLEFT" }, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "caption", "bbox": { "l": 134.76498, "t": 275.07232999999997, "r": 480.5954, "b": 327.0408, "coord_origin": "TOPLEFT" }, "confidence": 0.9570781588554382, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 282.9986, "r_x1": 160.11836, "r_y1": 282.9986, "r_x2": 160.11836, "r_y2": 275.07232999999997, "r_x3": 134.76498, "r_y3": 275.07232999999997, "coord_origin": "TOPLEFT" }, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.34528, "r_y0": 282.9986, "r_x1": 175.59526, "r_y1": 282.9986, "r_x2": 175.59526, "r_y2": 275.07232999999997, "r_x3": 167.34528, "r_y3": 275.07232999999997, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.13298, "r_y0": 283.2048300000001, "r_x1": 480.59365999999994, "r_y1": 283.2048300000001, "r_x2": 480.59365999999994, "r_y2": 275.13507000000004, "r_x3": 188.13298, "r_y3": 275.13507000000004, "coord_origin": "TOPLEFT" }, "text": "HPO performed in OTSL and HTML representation on the same", "orig": "HPO performed in OTSL and HTML representation on the same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 294.16385, "r_x1": 480.59444999999994, "r_y1": 294.16385, "r_x2": 480.59444999999994, "r_y2": 286.09409, "r_x3": 134.76498, "r_y3": 286.09409, "coord_origin": "TOPLEFT" }, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 305.12283, "r_x1": 480.5954, "r_y1": 305.12283, "r_x2": 480.5954, "r_y2": 297.05307, "r_x3": 134.76498, "r_y3": 297.05307, "coord_origin": "TOPLEFT" }, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 316.08182, "r_x1": 480.59451, "r_y1": 316.08182, "r_x2": 480.59451, "r_y2": 308.01205, "r_x3": 134.76498, "r_y3": 308.01205, "coord_origin": "TOPLEFT" }, "text": "smaller models trained on OTSL perform better, especially in recognizing complex", "orig": "smaller models trained on OTSL perform better, especially in recognizing complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 327.0408, "r_x1": 480.59441999999996, "r_y1": 327.0408, "r_x2": 480.59441999999996, "r_y2": 318.97104, "r_x3": 134.76498, "r_y3": 318.97104, "coord_origin": "TOPLEFT" }, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "table", "bbox": { "l": 139.66845703125, "t": 337.5747985839844, "r": 475.00372314453125, "b": 469.4721374511719, "coord_origin": "TOPLEFT" }, "confidence": 0.9901032447814941, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8047199999999, "r_x1": 168.04793, "r_y1": 349.8047199999999, "r_x2": 168.04793, "r_y2": 341.73495, "r_x3": 160.37, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.592, "r_y0": 362.75570999999997, "r_x1": 183.82806, "r_y1": 362.75570999999997, "r_x2": 183.82806, "r_y2": 354.68594, "r_x3": 144.592, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.974, "r_y0": 349.8047199999999, "r_x1": 215.65193, "r_y1": 349.8047199999999, "r_x2": 215.65193, "r_y2": 341.73495, "r_x3": 207.974, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19499, "r_y0": 362.75570999999997, "r_x1": 231.43106, "r_y1": 362.75570999999997, "r_x2": 231.43106, "r_y2": 354.68594, "r_x3": 192.19499, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.79799999999997, "r_y0": 355.28372, "r_x1": 278.31766, "r_y1": 355.28372, "r_x2": 278.31766, "r_y2": 347.21396, "r_x3": 239.79799999999997, "r_y3": 347.21396, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67001, "r_y0": 349.8047199999999, "r_x1": 348.26419, "r_y1": 349.8047199999999, "r_x2": 348.26419, "r_y2": 341.73495, "r_x3": 324.67001, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.271, "r_y0": 349.8047199999999, "r_x1": 417.12683, "r_y1": 349.8047199999999, "r_x2": 417.12683, "r_y2": 341.73495, "r_x3": 396.271, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.927, "r_y0": 360.7637, "r_x1": 418.47278, "r_y1": 360.7637, "r_x2": 418.47278, "r_y2": 352.69394000000005, "r_x3": 394.927, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.771, "r_y0": 349.8047199999999, "r_x1": 467.1423, "r_y1": 349.8047199999999, "r_x2": 467.1423, "r_y2": 341.73495, "r_x3": 430.771, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.14801, "r_y0": 360.7637, "r_x1": 470.76056, "r_y1": 360.7637, "r_x2": 470.76056, "r_y2": 352.69394000000005, "r_x3": 427.14801, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.686, "r_y0": 362.75570999999997, "r_x1": 312.33261, "r_y1": 362.75570999999997, "r_x2": 312.33261, "r_y2": 354.68594, "r_x3": 286.686, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.702, "r_y0": 362.75570999999997, "r_x1": 353.71988, "r_y1": 362.75570999999997, "r_x2": 353.71988, "r_y2": 354.68594, "r_x3": 320.702, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.306, "r_y0": 362.75570999999997, "r_x1": 379.03094, "r_y1": 362.75570999999997, "r_x2": 379.03094, "r_y2": 354.68594, "r_x3": 369.306, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 381.58572, "r_x1": 166.51294, "r_y1": 381.58572, "r_x2": 166.51294, "r_y2": 373.51596, "r_x3": 161.90601, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 381.58572, "r_x1": 214.11594, "r_y1": 381.58572, "r_x2": 214.11594, "r_y2": 373.51596, "r_x3": 209.509, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 376.10571, "r_x1": 271.40527, "r_y1": 376.10571, "r_x2": 271.40527, "r_y2": 368.03595, "r_x3": 246.71000999999998, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 376.10571, "r_x1": 310.00375, "r_y1": 376.10571, "r_x2": 310.00375, "r_y2": 368.03595, "r_x3": 289.017, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 376.10571, "r_x1": 347.70377, "r_y1": 376.10571, "r_x2": 347.70377, "r_y2": 368.03595, "r_x3": 326.71701, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 376.10571, "r_x1": 384.66275, "r_y1": 376.10571, "r_x2": 384.66275, "r_y2": 368.03595, "r_x3": 363.67599, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.26999, "r_y0": 375.89948, "r_x1": 416.12723, "r_y1": 375.89948, "r_x2": 416.12723, "r_y2": 367.97317999999996, "r_x3": 397.26999, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 375.89948, "r_x1": 458.38425, "r_y1": 375.89948, "r_x2": 458.38425, "r_y2": 367.97317999999996, "r_x3": 439.52701, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 389.05771, "r_x1": 272.93954, "r_y1": 389.05771, "r_x2": 272.93954, "r_y2": 380.98795, "r_x3": 245.17598999999998, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 389.05771, "r_x1": 310.00375, "r_y1": 389.05771, "r_x2": 310.00375, "r_y2": 380.98795, "r_x3": 289.017, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 389.05771, "r_x1": 347.70377, "r_y1": 389.05771, "r_x2": 347.70377, "r_y2": 380.98795, "r_x3": 326.71701, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 389.05771, "r_x1": 384.66275, "r_y1": 389.05771, "r_x2": 384.66275, "r_y2": 380.98795, "r_x3": 363.67599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 389.05771, "r_x1": 417.19275, "r_y1": 389.05771, "r_x2": 417.19275, "r_y2": 380.98795, "r_x3": 396.20599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 389.05771, "r_x1": 457.14682, "r_y1": 389.05771, "r_x2": 457.14682, "r_y2": 380.98795, "r_x3": 440.767, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 407.88672, "r_x1": 166.51294, "r_y1": 407.88672, "r_x2": 166.51294, "r_y2": 399.81696, "r_x3": 161.90601, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 407.88672, "r_x1": 214.11594, "r_y1": 407.88672, "r_x2": 214.11594, "r_y2": 399.81696, "r_x3": 209.509, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 402.40771, "r_x1": 271.40527, "r_y1": 402.40771, "r_x2": 271.40527, "r_y2": 394.33795, "r_x3": 246.71000999999998, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 402.40771, "r_x1": 310.00375, "r_y1": 402.40771, "r_x2": 310.00375, "r_y2": 394.33795, "r_x3": 289.017, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 402.40771, "r_x1": 347.70377, "r_y1": 402.40771, "r_x2": 347.70377, "r_y2": 394.33795, "r_x3": 326.71701, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 402.40771, "r_x1": 384.66275, "r_y1": 402.40771, "r_x2": 384.66275, "r_y2": 394.33795, "r_x3": 363.67599, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 402.20148, "r_x1": 418.77887, "r_y1": 402.20148, "r_x2": 418.77887, "r_y2": 394.27518, "r_x3": 394.61801, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 402.20148, "r_x1": 458.38425, "r_y1": 402.20148, "r_x2": 458.38425, "r_y2": 394.27518, "r_x3": 439.52701, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 415.3587, "r_x1": 272.93954, "r_y1": 415.3587, "r_x2": 272.93954, "r_y2": 407.28894, "r_x3": 245.17598999999998, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 415.3587, "r_x1": 310.00375, "r_y1": 415.3587, "r_x2": 310.00375, "r_y2": 407.28894, "r_x3": 289.017, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 415.3587, "r_x1": 347.70377, "r_y1": 415.3587, "r_x2": 347.70377, "r_y2": 407.28894, "r_x3": 326.71701, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 415.15247, "r_x1": 386.24887, "r_y1": 415.15247, "r_x2": 386.24887, "r_y2": 407.22617, "r_x3": 362.08801, "r_y3": 407.22617, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 415.3587, "r_x1": 417.19275, "r_y1": 415.3587, "r_x2": 417.19275, "r_y2": 407.28894, "r_x3": 396.20599, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 415.3587, "r_x1": 457.14682, "r_y1": 415.3587, "r_x2": 457.14682, "r_y2": 407.28894, "r_x3": 440.767, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 434.1877099999999, "r_x1": 166.51294, "r_y1": 434.1877099999999, "r_x2": 166.51294, "r_y2": 426.11795, "r_x3": 161.90601, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 434.1877099999999, "r_x1": 214.11594, "r_y1": 434.1877099999999, "r_x2": 214.11594, "r_y2": 426.11795, "r_x3": 209.509, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 428.70871, "r_x1": 271.40527, "r_y1": 428.70871, "r_x2": 271.40527, "r_y2": 420.63895, "r_x3": 246.71000999999998, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 428.70871, "r_x1": 310.00375, "r_y1": 428.70871, "r_x2": 310.00375, "r_y2": 420.63895, "r_x3": 289.017, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 428.70871, "r_x1": 347.70377, "r_y1": 428.70871, "r_x2": 347.70377, "r_y2": 420.63895, "r_x3": 326.71701, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 428.70871, "r_x1": 384.66275, "r_y1": 428.70871, "r_x2": 384.66275, "r_y2": 420.63895, "r_x3": 363.67599, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 428.50247, "r_x1": 418.77887, "r_y1": 428.50247, "r_x2": 418.77887, "r_y2": 420.57617, "r_x3": 394.61801, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 428.50247, "r_x1": 458.38425, "r_y1": 428.50247, "r_x2": 458.38425, "r_y2": 420.57617, "r_x3": 439.52701, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 441.6597, "r_x1": 272.93954, "r_y1": 441.6597, "r_x2": 272.93954, "r_y2": 433.58994, "r_x3": 245.17598999999998, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 441.6597, "r_x1": 310.00375, "r_y1": 441.6597, "r_x2": 310.00375, "r_y2": 433.58994, "r_x3": 289.017, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 441.6597, "r_x1": 347.70377, "r_y1": 441.6597, "r_x2": 347.70377, "r_y2": 433.58994, "r_x3": 326.71701, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 441.45346, "r_x1": 386.24887, "r_y1": 441.45346, "r_x2": 386.24887, "r_y2": 433.5271599999999, "r_x3": 362.08801, "r_y3": 433.5271599999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 441.6597, "r_x1": 417.19275, "r_y1": 441.6597, "r_x2": 417.19275, "r_y2": 433.58994, "r_x3": 396.20599, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 441.6597, "r_x1": 457.14682, "r_y1": 441.6597, "r_x2": 457.14682, "r_y2": 433.58994, "r_x3": 440.767, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 460.48972, "r_x1": 166.51294, "r_y1": 460.48972, "r_x2": 166.51294, "r_y2": 452.41995, "r_x3": 161.90601, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 460.48972, "r_x1": 214.11594, "r_y1": 460.48972, "r_x2": 214.11594, "r_y2": 452.41995, "r_x3": 209.509, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 455.0097, "r_x1": 271.40527, "r_y1": 455.0097, "r_x2": 271.40527, "r_y2": 446.9399399999999, "r_x3": 246.71000999999998, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 455.0097, "r_x1": 310.00375, "r_y1": 455.0097, "r_x2": 310.00375, "r_y2": 446.9399399999999, "r_x3": 289.017, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.021, "r_y0": 455.0097, "r_x1": 345.40082, "r_y1": 455.0097, "r_x2": 345.40082, "r_y2": 446.9399399999999, "r_x3": 329.021, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 454.80347, "r_x1": 386.24887, "r_y1": 454.80347, "r_x2": 386.24887, "r_y2": 446.87717, "r_x3": 362.08801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 454.80347, "r_x1": 418.77887, "r_y1": 454.80347, "r_x2": 418.77887, "r_y2": 446.87717, "r_x3": 394.61801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 454.80347, "r_x1": 458.38425, "r_y1": 454.80347, "r_x2": 458.38425, "r_y2": 446.87717, "r_x3": 439.52701, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 467.9617, "r_x1": 272.93954, "r_y1": 467.9617, "r_x2": 272.93954, "r_y2": 459.8919399999999, "r_x3": 245.17598999999998, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 467.9617, "r_x1": 310.00375, "r_y1": 467.9617, "r_x2": 310.00375, "r_y2": 459.8919399999999, "r_x3": 289.017, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 467.9617, "r_x1": 347.70377, "r_y1": 467.9617, "r_x2": 347.70377, "r_y2": 459.8919399999999, "r_x3": 326.71701, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 467.9617, "r_x1": 384.66275, "r_y1": 467.9617, "r_x2": 384.66275, "r_y2": 459.8919399999999, "r_x3": 363.67599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 467.9617, "r_x1": 417.19275, "r_y1": 467.9617, "r_x2": 417.19275, "r_y2": 459.8919399999999, "r_x3": 396.20599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65302, "r_y0": 467.9617, "r_x1": 451.25995, "r_y1": 467.9617, "r_x2": 451.25995, "r_y2": 459.8919399999999, "r_x3": 446.65302, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 160.37, "t": 341.73495, "r": 168.04793, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8047199999999, "r_x1": 168.04793, "r_y1": 349.8047199999999, "r_x2": 168.04793, "r_y2": 341.73495, "r_x3": 160.37, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 144.592, "t": 354.68594, "r": 183.82806, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.592, "r_y0": 362.75570999999997, "r_x1": 183.82806, "r_y1": 362.75570999999997, "r_x2": 183.82806, "r_y2": 354.68594, "r_x3": 144.592, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 207.974, "t": 341.73495, "r": 215.65193, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.974, "r_y0": 349.8047199999999, "r_x1": 215.65193, "r_y1": 349.8047199999999, "r_x2": 215.65193, "r_y2": 341.73495, "r_x3": 207.974, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 192.19499, "t": 354.68594, "r": 231.43106, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19499, "r_y0": 362.75570999999997, "r_x1": 231.43106, "r_y1": 362.75570999999997, "r_x2": 231.43106, "r_y2": 354.68594, "r_x3": 192.19499, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 239.79799999999997, "t": 347.21396, "r": 278.31766, "b": 355.28372, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.79799999999997, "r_y0": 355.28372, "r_x1": 278.31766, "r_y1": 355.28372, "r_x2": 278.31766, "r_y2": 347.21396, "r_x3": 239.79799999999997, "r_y3": 347.21396, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 324.67001, "t": 341.73495, "r": 348.26419, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67001, "r_y0": 349.8047199999999, "r_x1": 348.26419, "r_y1": 349.8047199999999, "r_x2": 348.26419, "r_y2": 341.73495, "r_x3": 324.67001, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 396.271, "t": 341.73495, "r": 417.12683, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.271, "r_y0": 349.8047199999999, "r_x1": 417.12683, "r_y1": 349.8047199999999, "r_x2": 417.12683, "r_y2": 341.73495, "r_x3": 396.271, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 394.927, "t": 352.69394000000005, "r": 418.47278, "b": 360.7637, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.927, "r_y0": 360.7637, "r_x1": 418.47278, "r_y1": 360.7637, "r_x2": 418.47278, "r_y2": 352.69394000000005, "r_x3": 394.927, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 430.771, "t": 341.73495, "r": 467.1423, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.771, "r_y0": 349.8047199999999, "r_x1": 467.1423, "r_y1": 349.8047199999999, "r_x2": 467.1423, "r_y2": 341.73495, "r_x3": 430.771, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 427.14801, "t": 352.69394000000005, "r": 470.76056, "b": 360.7637, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.14801, "r_y0": 360.7637, "r_x1": 470.76056, "r_y1": 360.7637, "r_x2": 470.76056, "r_y2": 352.69394000000005, "r_x3": 427.14801, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 286.686, "t": 354.68594, "r": 312.33261, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.686, "r_y0": 362.75570999999997, "r_x1": 312.33261, "r_y1": 362.75570999999997, "r_x2": 312.33261, "r_y2": 354.68594, "r_x3": 286.686, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 320.702, "t": 354.68594, "r": 353.71988, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.702, "r_y0": 362.75570999999997, "r_x1": 353.71988, "r_y1": 362.75570999999997, "r_x2": 353.71988, "r_y2": 354.68594, "r_x3": 320.702, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 369.306, "t": 354.68594, "r": 379.03094, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.306, "r_y0": 362.75570999999997, "r_x1": 379.03094, "r_y1": 362.75570999999997, "r_x2": 379.03094, "r_y2": 354.68594, "r_x3": 369.306, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 161.90601, "t": 373.51596, "r": 166.51294, "b": 381.58572, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 381.58572, "r_x1": 166.51294, "r_y1": 381.58572, "r_x2": 166.51294, "r_y2": 373.51596, "r_x3": 161.90601, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 209.509, "t": 373.51596, "r": 214.11594, "b": 381.58572, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 381.58572, "r_x1": 214.11594, "r_y1": 381.58572, "r_x2": 214.11594, "r_y2": 373.51596, "r_x3": 209.509, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 246.71000999999998, "t": 368.03595, "r": 271.40527, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 376.10571, "r_x1": 271.40527, "r_y1": 376.10571, "r_x2": 271.40527, "r_y2": 368.03595, "r_x3": 246.71000999999998, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 289.017, "t": 368.03595, "r": 310.00375, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 376.10571, "r_x1": 310.00375, "r_y1": 376.10571, "r_x2": 310.00375, "r_y2": 368.03595, "r_x3": 289.017, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 326.71701, "t": 368.03595, "r": 347.70377, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 376.10571, "r_x1": 347.70377, "r_y1": 376.10571, "r_x2": 347.70377, "r_y2": 368.03595, "r_x3": 326.71701, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 363.67599, "t": 368.03595, "r": 384.66275, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 376.10571, "r_x1": 384.66275, "r_y1": 376.10571, "r_x2": 384.66275, "r_y2": 368.03595, "r_x3": 363.67599, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 397.26999, "t": 367.97317999999996, "r": 416.12723, "b": 375.89948, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.26999, "r_y0": 375.89948, "r_x1": 416.12723, "r_y1": 375.89948, "r_x2": 416.12723, "r_y2": 367.97317999999996, "r_x3": 397.26999, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 439.52701, "t": 367.97317999999996, "r": 458.38425, "b": 375.89948, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 375.89948, "r_x1": 458.38425, "r_y1": 375.89948, "r_x2": 458.38425, "r_y2": 367.97317999999996, "r_x3": 439.52701, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 245.17598999999998, "t": 380.98795, "r": 272.93954, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 389.05771, "r_x1": 272.93954, "r_y1": 389.05771, "r_x2": 272.93954, "r_y2": 380.98795, "r_x3": 245.17598999999998, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 289.017, "t": 380.98795, "r": 310.00375, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 389.05771, "r_x1": 310.00375, "r_y1": 389.05771, "r_x2": 310.00375, "r_y2": 380.98795, "r_x3": 289.017, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 326.71701, "t": 380.98795, "r": 347.70377, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 389.05771, "r_x1": 347.70377, "r_y1": 389.05771, "r_x2": 347.70377, "r_y2": 380.98795, "r_x3": 326.71701, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 363.67599, "t": 380.98795, "r": 384.66275, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 389.05771, "r_x1": 384.66275, "r_y1": 389.05771, "r_x2": 384.66275, "r_y2": 380.98795, "r_x3": 363.67599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.20599, "t": 380.98795, "r": 417.19275, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 389.05771, "r_x1": 417.19275, "r_y1": 389.05771, "r_x2": 417.19275, "r_y2": 380.98795, "r_x3": 396.20599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 440.767, "t": 380.98795, "r": 457.14682, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 389.05771, "r_x1": 457.14682, "r_y1": 389.05771, "r_x2": 457.14682, "r_y2": 380.98795, "r_x3": 440.767, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 161.90601, "t": 399.81696, "r": 166.51294, "b": 407.88672, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 407.88672, "r_x1": 166.51294, "r_y1": 407.88672, "r_x2": 166.51294, "r_y2": 399.81696, "r_x3": 161.90601, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 209.509, "t": 399.81696, "r": 214.11594, "b": 407.88672, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 407.88672, "r_x1": 214.11594, "r_y1": 407.88672, "r_x2": 214.11594, "r_y2": 399.81696, "r_x3": 209.509, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 246.71000999999998, "t": 394.33795, "r": 271.40527, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 402.40771, "r_x1": 271.40527, "r_y1": 402.40771, "r_x2": 271.40527, "r_y2": 394.33795, "r_x3": 246.71000999999998, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 289.017, "t": 394.33795, "r": 310.00375, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 402.40771, "r_x1": 310.00375, "r_y1": 402.40771, "r_x2": 310.00375, "r_y2": 394.33795, "r_x3": 289.017, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 326.71701, "t": 394.33795, "r": 347.70377, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 402.40771, "r_x1": 347.70377, "r_y1": 402.40771, "r_x2": 347.70377, "r_y2": 394.33795, "r_x3": 326.71701, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 363.67599, "t": 394.33795, "r": 384.66275, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 402.40771, "r_x1": 384.66275, "r_y1": 402.40771, "r_x2": 384.66275, "r_y2": 394.33795, "r_x3": 363.67599, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 394.61801, "t": 394.27518, "r": 418.77887, "b": 402.20148, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 402.20148, "r_x1": 418.77887, "r_y1": 402.20148, "r_x2": 418.77887, "r_y2": 394.27518, "r_x3": 394.61801, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 439.52701, "t": 394.27518, "r": 458.38425, "b": 402.20148, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 402.20148, "r_x1": 458.38425, "r_y1": 402.20148, "r_x2": 458.38425, "r_y2": 394.27518, "r_x3": 439.52701, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 245.17598999999998, "t": 407.28894, "r": 272.93954, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 415.3587, "r_x1": 272.93954, "r_y1": 415.3587, "r_x2": 272.93954, "r_y2": 407.28894, "r_x3": 245.17598999999998, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 289.017, "t": 407.28894, "r": 310.00375, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 415.3587, "r_x1": 310.00375, "r_y1": 415.3587, "r_x2": 310.00375, "r_y2": 407.28894, "r_x3": 289.017, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 326.71701, "t": 407.28894, "r": 347.70377, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 415.3587, "r_x1": 347.70377, "r_y1": 415.3587, "r_x2": 347.70377, "r_y2": 407.28894, "r_x3": 326.71701, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 362.08801, "t": 407.22617, "r": 386.24887, "b": 415.15247, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 415.15247, "r_x1": 386.24887, "r_y1": 415.15247, "r_x2": 386.24887, "r_y2": 407.22617, "r_x3": 362.08801, "r_y3": 407.22617, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 396.20599, "t": 407.28894, "r": 417.19275, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 415.3587, "r_x1": 417.19275, "r_y1": 415.3587, "r_x2": 417.19275, "r_y2": 407.28894, "r_x3": 396.20599, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 440.767, "t": 407.28894, "r": 457.14682, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 415.3587, "r_x1": 457.14682, "r_y1": 415.3587, "r_x2": 457.14682, "r_y2": 407.28894, "r_x3": 440.767, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 161.90601, "t": 426.11795, "r": 166.51294, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 434.1877099999999, "r_x1": 166.51294, "r_y1": 434.1877099999999, "r_x2": 166.51294, "r_y2": 426.11795, "r_x3": 161.90601, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 209.509, "t": 426.11795, "r": 214.11594, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 434.1877099999999, "r_x1": 214.11594, "r_y1": 434.1877099999999, "r_x2": 214.11594, "r_y2": 426.11795, "r_x3": 209.509, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 246.71000999999998, "t": 420.63895, "r": 271.40527, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 428.70871, "r_x1": 271.40527, "r_y1": 428.70871, "r_x2": 271.40527, "r_y2": 420.63895, "r_x3": 246.71000999999998, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 289.017, "t": 420.63895, "r": 310.00375, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 428.70871, "r_x1": 310.00375, "r_y1": 428.70871, "r_x2": 310.00375, "r_y2": 420.63895, "r_x3": 289.017, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.71701, "t": 420.63895, "r": 347.70377, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 428.70871, "r_x1": 347.70377, "r_y1": 428.70871, "r_x2": 347.70377, "r_y2": 420.63895, "r_x3": 326.71701, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 363.67599, "t": 420.63895, "r": 384.66275, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 428.70871, "r_x1": 384.66275, "r_y1": 428.70871, "r_x2": 384.66275, "r_y2": 420.63895, "r_x3": 363.67599, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 394.61801, "t": 420.57617, "r": 418.77887, "b": 428.50247, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 428.50247, "r_x1": 418.77887, "r_y1": 428.50247, "r_x2": 418.77887, "r_y2": 420.57617, "r_x3": 394.61801, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 439.52701, "t": 420.57617, "r": 458.38425, "b": 428.50247, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 428.50247, "r_x1": 458.38425, "r_y1": 428.50247, "r_x2": 458.38425, "r_y2": 420.57617, "r_x3": 439.52701, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 245.17598999999998, "t": 433.58994, "r": 272.93954, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 441.6597, "r_x1": 272.93954, "r_y1": 441.6597, "r_x2": 272.93954, "r_y2": 433.58994, "r_x3": 245.17598999999998, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 289.017, "t": 433.58994, "r": 310.00375, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 441.6597, "r_x1": 310.00375, "r_y1": 441.6597, "r_x2": 310.00375, "r_y2": 433.58994, "r_x3": 289.017, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 326.71701, "t": 433.58994, "r": 347.70377, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 441.6597, "r_x1": 347.70377, "r_y1": 441.6597, "r_x2": 347.70377, "r_y2": 433.58994, "r_x3": 326.71701, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 362.08801, "t": 433.5271599999999, "r": 386.24887, "b": 441.45346, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 441.45346, "r_x1": 386.24887, "r_y1": 441.45346, "r_x2": 386.24887, "r_y2": 433.5271599999999, "r_x3": 362.08801, "r_y3": 433.5271599999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 396.20599, "t": 433.58994, "r": 417.19275, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 441.6597, "r_x1": 417.19275, "r_y1": 441.6597, "r_x2": 417.19275, "r_y2": 433.58994, "r_x3": 396.20599, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 440.767, "t": 433.58994, "r": 457.14682, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 441.6597, "r_x1": 457.14682, "r_y1": 441.6597, "r_x2": 457.14682, "r_y2": 433.58994, "r_x3": 440.767, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 161.90601, "t": 452.41995, "r": 166.51294, "b": 460.48972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 460.48972, "r_x1": 166.51294, "r_y1": 460.48972, "r_x2": 166.51294, "r_y2": 452.41995, "r_x3": 161.90601, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 209.509, "t": 452.41995, "r": 214.11594, "b": 460.48972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 460.48972, "r_x1": 214.11594, "r_y1": 460.48972, "r_x2": 214.11594, "r_y2": 452.41995, "r_x3": 209.509, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 246.71000999999998, "t": 446.9399399999999, "r": 271.40527, "b": 455.0097, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 455.0097, "r_x1": 271.40527, "r_y1": 455.0097, "r_x2": 271.40527, "r_y2": 446.9399399999999, "r_x3": 246.71000999999998, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 289.017, "t": 446.9399399999999, "r": 310.00375, "b": 455.0097, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 455.0097, "r_x1": 310.00375, "r_y1": 455.0097, "r_x2": 310.00375, "r_y2": 446.9399399999999, "r_x3": 289.017, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 329.021, "t": 446.9399399999999, "r": 345.40082, "b": 455.0097, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.021, "r_y0": 455.0097, "r_x1": 345.40082, "r_y1": 455.0097, "r_x2": 345.40082, "r_y2": 446.9399399999999, "r_x3": 329.021, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 362.08801, "t": 446.87717, "r": 386.24887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 454.80347, "r_x1": 386.24887, "r_y1": 454.80347, "r_x2": 386.24887, "r_y2": 446.87717, "r_x3": 362.08801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.61801, "t": 446.87717, "r": 418.77887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 454.80347, "r_x1": 418.77887, "r_y1": 454.80347, "r_x2": 418.77887, "r_y2": 446.87717, "r_x3": 394.61801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 439.52701, "t": 446.87717, "r": 458.38425, "b": 454.80347, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 454.80347, "r_x1": 458.38425, "r_y1": 454.80347, "r_x2": 458.38425, "r_y2": 446.87717, "r_x3": 439.52701, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 245.17598999999998, "t": 459.8919399999999, "r": 272.93954, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 467.9617, "r_x1": 272.93954, "r_y1": 467.9617, "r_x2": 272.93954, "r_y2": 459.8919399999999, "r_x3": 245.17598999999998, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.017, "t": 459.8919399999999, "r": 310.00375, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 467.9617, "r_x1": 310.00375, "r_y1": 467.9617, "r_x2": 310.00375, "r_y2": 459.8919399999999, "r_x3": 289.017, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 326.71701, "t": 459.8919399999999, "r": 347.70377, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 467.9617, "r_x1": 347.70377, "r_y1": 467.9617, "r_x2": 347.70377, "r_y2": 459.8919399999999, "r_x3": 326.71701, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 363.67599, "t": 459.8919399999999, "r": 384.66275, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 467.9617, "r_x1": 384.66275, "r_y1": 467.9617, "r_x2": 384.66275, "r_y2": 459.8919399999999, "r_x3": 363.67599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 396.20599, "t": 459.8919399999999, "r": 417.19275, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 467.9617, "r_x1": 417.19275, "r_y1": 467.9617, "r_x2": 417.19275, "r_y2": 459.8919399999999, "r_x3": 396.20599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 446.65302, "t": 459.8919399999999, "r": 451.25995, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65302, "r_y0": 467.9617, "r_x1": 451.25995, "r_y1": 467.9617, "r_x2": 451.25995, "r_y2": 459.8919399999999, "r_x3": 446.65302, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 5, "label": "section_header", "bbox": { "l": 134.765, "t": 508.15179, "r": 264.40332, "b": 516.95874, "coord_origin": "TOPLEFT" }, "confidence": 0.9592539668083191, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 516.95874, "r_x1": 149.40205, "r_y1": 516.95874, "r_x2": 149.40205, "r_y2": 508.15179, "r_x3": 134.765, "r_y3": 508.15179, "coord_origin": "TOPLEFT" }, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 516.95874, "r_x1": 264.40332, "r_y1": 516.95874, "r_x2": 264.40332, "r_y2": 508.15179, "r_x3": 160.85904, "r_y3": 508.15179, "coord_origin": "TOPLEFT" }, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 524.55078, "r": 480.5957599999999, "b": 617.03474, "coord_origin": "TOPLEFT" }, "confidence": 0.9854757189750671, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 533.34775, "r_x1": 480.59075999999993, "r_y1": 533.34775, "r_x2": 480.59075999999993, "r_y2": 524.55078, "r_x3": 134.765, "r_y3": 524.55078, "coord_origin": "TOPLEFT" }, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 545.3037400000001, "r_x1": 480.58675999999997, "r_y1": 545.3037400000001, "r_x2": 480.58675999999997, "r_y2": 536.50677, "r_x3": 134.765, "r_y3": 536.50677, "coord_origin": "TOPLEFT" }, "text": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 557.25874, "r_x1": 480.59572999999995, "r_y1": 557.25874, "r_x2": 480.59572999999995, "r_y2": 548.4617800000001, "r_x3": 134.765, "r_y3": 548.4617800000001, "coord_origin": "TOPLEFT" }, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 569.21375, "r_x1": 480.59177000000005, "r_y1": 569.21375, "r_x2": 480.59177000000005, "r_y2": 560.41678, "r_x3": 134.765, "r_y3": 560.41678, "coord_origin": "TOPLEFT" }, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 581.16875, "r_x1": 480.59069999999997, "r_y1": 581.16875, "r_x2": 480.59069999999997, "r_y2": 572.37178, "r_x3": 134.765, "r_y3": 572.37178, "coord_origin": "TOPLEFT" }, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 593.12375, "r_x1": 480.5957599999999, "r_y1": 593.12375, "r_x2": 480.5957599999999, "r_y2": 584.32678, "r_x3": 134.765, "r_y3": 584.32678, "coord_origin": "TOPLEFT" }, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 605.07974, "r_x1": 480.58774, "r_y1": 605.07974, "r_x2": 480.58774, "r_y2": 596.28278, "r_x3": 134.765, "r_y3": 596.28278, "coord_origin": "TOPLEFT" }, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 617.03474, "r_x1": 206.78664, "r_y1": 617.03474, "r_x2": 206.78664, "r_y2": 608.2377799999999, "r_x3": 134.765, "r_y3": 608.2377799999999, "coord_origin": "TOPLEFT" }, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.765, "t": 620.19278, "r": 480.5957599999999, "b": 664.8547599999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9851234555244446, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 628.98975, "r_x1": 480.59271, "r_y1": 628.98975, "r_x2": 480.59271, "r_y2": 620.19278, "r_x3": 149.709, "r_y3": 620.19278, "coord_origin": "TOPLEFT" }, "text": "Additionally, the results show that OTSL has an advantage over HTML", "orig": "Additionally, the results show that OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 640.94475, "r_x1": 480.5957599999999, "r_y1": 640.94475, "r_x2": 480.5957599999999, "r_y2": 632.14778, "r_x3": 134.765, "r_y3": 632.14778, "coord_origin": "TOPLEFT" }, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 652.89975, "r_x1": 480.59283000000005, "r_y1": 652.89975, "r_x2": 480.59283000000005, "r_y2": 644.1027799999999, "r_x3": 134.765, "r_y3": 644.1027799999999, "coord_origin": "TOPLEFT" }, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 664.8547599999999, "r_x1": 405.79651, "r_y1": 664.8547599999999, "r_x2": 405.79651, "r_y2": 656.0577900000001, "r_x3": 134.765, "r_y3": 656.0577900000001, "coord_origin": "TOPLEFT" }, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": { "0": { "label": "table", "id": 0, "page_no": 8, "cluster": { "id": 0, "label": "table", "bbox": { "l": 139.66845703125, "t": 337.5747985839844, "r": 475.00372314453125, "b": 469.4721374511719, "coord_origin": "TOPLEFT" }, "confidence": 0.9901032447814941, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8047199999999, "r_x1": 168.04793, "r_y1": 349.8047199999999, "r_x2": 168.04793, "r_y2": 341.73495, "r_x3": 160.37, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.592, "r_y0": 362.75570999999997, "r_x1": 183.82806, "r_y1": 362.75570999999997, "r_x2": 183.82806, "r_y2": 354.68594, "r_x3": 144.592, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.974, "r_y0": 349.8047199999999, "r_x1": 215.65193, "r_y1": 349.8047199999999, "r_x2": 215.65193, "r_y2": 341.73495, "r_x3": 207.974, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19499, "r_y0": 362.75570999999997, "r_x1": 231.43106, "r_y1": 362.75570999999997, "r_x2": 231.43106, "r_y2": 354.68594, "r_x3": 192.19499, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.79799999999997, "r_y0": 355.28372, "r_x1": 278.31766, "r_y1": 355.28372, "r_x2": 278.31766, "r_y2": 347.21396, "r_x3": 239.79799999999997, "r_y3": 347.21396, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67001, "r_y0": 349.8047199999999, "r_x1": 348.26419, "r_y1": 349.8047199999999, "r_x2": 348.26419, "r_y2": 341.73495, "r_x3": 324.67001, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.271, "r_y0": 349.8047199999999, "r_x1": 417.12683, "r_y1": 349.8047199999999, "r_x2": 417.12683, "r_y2": 341.73495, "r_x3": 396.271, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.927, "r_y0": 360.7637, "r_x1": 418.47278, "r_y1": 360.7637, "r_x2": 418.47278, "r_y2": 352.69394000000005, "r_x3": 394.927, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.771, "r_y0": 349.8047199999999, "r_x1": 467.1423, "r_y1": 349.8047199999999, "r_x2": 467.1423, "r_y2": 341.73495, "r_x3": 430.771, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.14801, "r_y0": 360.7637, "r_x1": 470.76056, "r_y1": 360.7637, "r_x2": 470.76056, "r_y2": 352.69394000000005, "r_x3": 427.14801, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.686, "r_y0": 362.75570999999997, "r_x1": 312.33261, "r_y1": 362.75570999999997, "r_x2": 312.33261, "r_y2": 354.68594, "r_x3": 286.686, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.702, "r_y0": 362.75570999999997, "r_x1": 353.71988, "r_y1": 362.75570999999997, "r_x2": 353.71988, "r_y2": 354.68594, "r_x3": 320.702, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.306, "r_y0": 362.75570999999997, "r_x1": 379.03094, "r_y1": 362.75570999999997, "r_x2": 379.03094, "r_y2": 354.68594, "r_x3": 369.306, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 381.58572, "r_x1": 166.51294, "r_y1": 381.58572, "r_x2": 166.51294, "r_y2": 373.51596, "r_x3": 161.90601, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 381.58572, "r_x1": 214.11594, "r_y1": 381.58572, "r_x2": 214.11594, "r_y2": 373.51596, "r_x3": 209.509, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 376.10571, "r_x1": 271.40527, "r_y1": 376.10571, "r_x2": 271.40527, "r_y2": 368.03595, "r_x3": 246.71000999999998, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 376.10571, "r_x1": 310.00375, "r_y1": 376.10571, "r_x2": 310.00375, "r_y2": 368.03595, "r_x3": 289.017, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 376.10571, "r_x1": 347.70377, "r_y1": 376.10571, "r_x2": 347.70377, "r_y2": 368.03595, "r_x3": 326.71701, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 376.10571, "r_x1": 384.66275, "r_y1": 376.10571, "r_x2": 384.66275, "r_y2": 368.03595, "r_x3": 363.67599, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.26999, "r_y0": 375.89948, "r_x1": 416.12723, "r_y1": 375.89948, "r_x2": 416.12723, "r_y2": 367.97317999999996, "r_x3": 397.26999, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 375.89948, "r_x1": 458.38425, "r_y1": 375.89948, "r_x2": 458.38425, "r_y2": 367.97317999999996, "r_x3": 439.52701, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 389.05771, "r_x1": 272.93954, "r_y1": 389.05771, "r_x2": 272.93954, "r_y2": 380.98795, "r_x3": 245.17598999999998, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 389.05771, "r_x1": 310.00375, "r_y1": 389.05771, "r_x2": 310.00375, "r_y2": 380.98795, "r_x3": 289.017, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 389.05771, "r_x1": 347.70377, "r_y1": 389.05771, "r_x2": 347.70377, "r_y2": 380.98795, "r_x3": 326.71701, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 389.05771, "r_x1": 384.66275, "r_y1": 389.05771, "r_x2": 384.66275, "r_y2": 380.98795, "r_x3": 363.67599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 389.05771, "r_x1": 417.19275, "r_y1": 389.05771, "r_x2": 417.19275, "r_y2": 380.98795, "r_x3": 396.20599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 389.05771, "r_x1": 457.14682, "r_y1": 389.05771, "r_x2": 457.14682, "r_y2": 380.98795, "r_x3": 440.767, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 407.88672, "r_x1": 166.51294, "r_y1": 407.88672, "r_x2": 166.51294, "r_y2": 399.81696, "r_x3": 161.90601, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 407.88672, "r_x1": 214.11594, "r_y1": 407.88672, "r_x2": 214.11594, "r_y2": 399.81696, "r_x3": 209.509, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 402.40771, "r_x1": 271.40527, "r_y1": 402.40771, "r_x2": 271.40527, "r_y2": 394.33795, "r_x3": 246.71000999999998, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 402.40771, "r_x1": 310.00375, "r_y1": 402.40771, "r_x2": 310.00375, "r_y2": 394.33795, "r_x3": 289.017, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 402.40771, "r_x1": 347.70377, "r_y1": 402.40771, "r_x2": 347.70377, "r_y2": 394.33795, "r_x3": 326.71701, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 402.40771, "r_x1": 384.66275, "r_y1": 402.40771, "r_x2": 384.66275, "r_y2": 394.33795, "r_x3": 363.67599, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 402.20148, "r_x1": 418.77887, "r_y1": 402.20148, "r_x2": 418.77887, "r_y2": 394.27518, "r_x3": 394.61801, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 402.20148, "r_x1": 458.38425, "r_y1": 402.20148, "r_x2": 458.38425, "r_y2": 394.27518, "r_x3": 439.52701, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 415.3587, "r_x1": 272.93954, "r_y1": 415.3587, "r_x2": 272.93954, "r_y2": 407.28894, "r_x3": 245.17598999999998, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 415.3587, "r_x1": 310.00375, "r_y1": 415.3587, "r_x2": 310.00375, "r_y2": 407.28894, "r_x3": 289.017, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 415.3587, "r_x1": 347.70377, "r_y1": 415.3587, "r_x2": 347.70377, "r_y2": 407.28894, "r_x3": 326.71701, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 415.15247, "r_x1": 386.24887, "r_y1": 415.15247, "r_x2": 386.24887, "r_y2": 407.22617, "r_x3": 362.08801, "r_y3": 407.22617, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 415.3587, "r_x1": 417.19275, "r_y1": 415.3587, "r_x2": 417.19275, "r_y2": 407.28894, "r_x3": 396.20599, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 415.3587, "r_x1": 457.14682, "r_y1": 415.3587, "r_x2": 457.14682, "r_y2": 407.28894, "r_x3": 440.767, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 434.1877099999999, "r_x1": 166.51294, "r_y1": 434.1877099999999, "r_x2": 166.51294, "r_y2": 426.11795, "r_x3": 161.90601, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 434.1877099999999, "r_x1": 214.11594, "r_y1": 434.1877099999999, "r_x2": 214.11594, "r_y2": 426.11795, "r_x3": 209.509, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 428.70871, "r_x1": 271.40527, "r_y1": 428.70871, "r_x2": 271.40527, "r_y2": 420.63895, "r_x3": 246.71000999999998, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 428.70871, "r_x1": 310.00375, "r_y1": 428.70871, "r_x2": 310.00375, "r_y2": 420.63895, "r_x3": 289.017, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 428.70871, "r_x1": 347.70377, "r_y1": 428.70871, "r_x2": 347.70377, "r_y2": 420.63895, "r_x3": 326.71701, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 428.70871, "r_x1": 384.66275, "r_y1": 428.70871, "r_x2": 384.66275, "r_y2": 420.63895, "r_x3": 363.67599, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 428.50247, "r_x1": 418.77887, "r_y1": 428.50247, "r_x2": 418.77887, "r_y2": 420.57617, "r_x3": 394.61801, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 428.50247, "r_x1": 458.38425, "r_y1": 428.50247, "r_x2": 458.38425, "r_y2": 420.57617, "r_x3": 439.52701, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 441.6597, "r_x1": 272.93954, "r_y1": 441.6597, "r_x2": 272.93954, "r_y2": 433.58994, "r_x3": 245.17598999999998, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 441.6597, "r_x1": 310.00375, "r_y1": 441.6597, "r_x2": 310.00375, "r_y2": 433.58994, "r_x3": 289.017, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 441.6597, "r_x1": 347.70377, "r_y1": 441.6597, "r_x2": 347.70377, "r_y2": 433.58994, "r_x3": 326.71701, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 441.45346, "r_x1": 386.24887, "r_y1": 441.45346, "r_x2": 386.24887, "r_y2": 433.5271599999999, "r_x3": 362.08801, "r_y3": 433.5271599999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 441.6597, "r_x1": 417.19275, "r_y1": 441.6597, "r_x2": 417.19275, "r_y2": 433.58994, "r_x3": 396.20599, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 441.6597, "r_x1": 457.14682, "r_y1": 441.6597, "r_x2": 457.14682, "r_y2": 433.58994, "r_x3": 440.767, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 460.48972, "r_x1": 166.51294, "r_y1": 460.48972, "r_x2": 166.51294, "r_y2": 452.41995, "r_x3": 161.90601, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 460.48972, "r_x1": 214.11594, "r_y1": 460.48972, "r_x2": 214.11594, "r_y2": 452.41995, "r_x3": 209.509, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 455.0097, "r_x1": 271.40527, "r_y1": 455.0097, "r_x2": 271.40527, "r_y2": 446.9399399999999, "r_x3": 246.71000999999998, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 455.0097, "r_x1": 310.00375, "r_y1": 455.0097, "r_x2": 310.00375, "r_y2": 446.9399399999999, "r_x3": 289.017, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.021, "r_y0": 455.0097, "r_x1": 345.40082, "r_y1": 455.0097, "r_x2": 345.40082, "r_y2": 446.9399399999999, "r_x3": 329.021, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 454.80347, "r_x1": 386.24887, "r_y1": 454.80347, "r_x2": 386.24887, "r_y2": 446.87717, "r_x3": 362.08801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 454.80347, "r_x1": 418.77887, "r_y1": 454.80347, "r_x2": 418.77887, "r_y2": 446.87717, "r_x3": 394.61801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 454.80347, "r_x1": 458.38425, "r_y1": 454.80347, "r_x2": 458.38425, "r_y2": 446.87717, "r_x3": 439.52701, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 467.9617, "r_x1": 272.93954, "r_y1": 467.9617, "r_x2": 272.93954, "r_y2": 459.8919399999999, "r_x3": 245.17598999999998, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 467.9617, "r_x1": 310.00375, "r_y1": 467.9617, "r_x2": 310.00375, "r_y2": 459.8919399999999, "r_x3": 289.017, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 467.9617, "r_x1": 347.70377, "r_y1": 467.9617, "r_x2": 347.70377, "r_y2": 459.8919399999999, "r_x3": 326.71701, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 467.9617, "r_x1": 384.66275, "r_y1": 467.9617, "r_x2": 384.66275, "r_y2": 459.8919399999999, "r_x3": 363.67599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 467.9617, "r_x1": 417.19275, "r_y1": 467.9617, "r_x2": 417.19275, "r_y2": 459.8919399999999, "r_x3": 396.20599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65302, "r_y0": 467.9617, "r_x1": 451.25995, "r_y1": 467.9617, "r_x2": 451.25995, "r_y2": 459.8919399999999, "r_x3": 446.65302, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 160.37, "t": 341.73495, "r": 168.04793, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8047199999999, "r_x1": 168.04793, "r_y1": 349.8047199999999, "r_x2": 168.04793, "r_y2": 341.73495, "r_x3": 160.37, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 144.592, "t": 354.68594, "r": 183.82806, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.592, "r_y0": 362.75570999999997, "r_x1": 183.82806, "r_y1": 362.75570999999997, "r_x2": 183.82806, "r_y2": 354.68594, "r_x3": 144.592, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 207.974, "t": 341.73495, "r": 215.65193, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.974, "r_y0": 349.8047199999999, "r_x1": 215.65193, "r_y1": 349.8047199999999, "r_x2": 215.65193, "r_y2": 341.73495, "r_x3": 207.974, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 192.19499, "t": 354.68594, "r": 231.43106, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19499, "r_y0": 362.75570999999997, "r_x1": 231.43106, "r_y1": 362.75570999999997, "r_x2": 231.43106, "r_y2": 354.68594, "r_x3": 192.19499, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 239.79799999999997, "t": 347.21396, "r": 278.31766, "b": 355.28372, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.79799999999997, "r_y0": 355.28372, "r_x1": 278.31766, "r_y1": 355.28372, "r_x2": 278.31766, "r_y2": 347.21396, "r_x3": 239.79799999999997, "r_y3": 347.21396, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 324.67001, "t": 341.73495, "r": 348.26419, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67001, "r_y0": 349.8047199999999, "r_x1": 348.26419, "r_y1": 349.8047199999999, "r_x2": 348.26419, "r_y2": 341.73495, "r_x3": 324.67001, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 396.271, "t": 341.73495, "r": 417.12683, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.271, "r_y0": 349.8047199999999, "r_x1": 417.12683, "r_y1": 349.8047199999999, "r_x2": 417.12683, "r_y2": 341.73495, "r_x3": 396.271, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 394.927, "t": 352.69394000000005, "r": 418.47278, "b": 360.7637, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.927, "r_y0": 360.7637, "r_x1": 418.47278, "r_y1": 360.7637, "r_x2": 418.47278, "r_y2": 352.69394000000005, "r_x3": 394.927, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 430.771, "t": 341.73495, "r": 467.1423, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.771, "r_y0": 349.8047199999999, "r_x1": 467.1423, "r_y1": 349.8047199999999, "r_x2": 467.1423, "r_y2": 341.73495, "r_x3": 430.771, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 427.14801, "t": 352.69394000000005, "r": 470.76056, "b": 360.7637, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.14801, "r_y0": 360.7637, "r_x1": 470.76056, "r_y1": 360.7637, "r_x2": 470.76056, "r_y2": 352.69394000000005, "r_x3": 427.14801, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 286.686, "t": 354.68594, "r": 312.33261, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.686, "r_y0": 362.75570999999997, "r_x1": 312.33261, "r_y1": 362.75570999999997, "r_x2": 312.33261, "r_y2": 354.68594, "r_x3": 286.686, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 320.702, "t": 354.68594, "r": 353.71988, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.702, "r_y0": 362.75570999999997, "r_x1": 353.71988, "r_y1": 362.75570999999997, "r_x2": 353.71988, "r_y2": 354.68594, "r_x3": 320.702, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 369.306, "t": 354.68594, "r": 379.03094, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.306, "r_y0": 362.75570999999997, "r_x1": 379.03094, "r_y1": 362.75570999999997, "r_x2": 379.03094, "r_y2": 354.68594, "r_x3": 369.306, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 161.90601, "t": 373.51596, "r": 166.51294, "b": 381.58572, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 381.58572, "r_x1": 166.51294, "r_y1": 381.58572, "r_x2": 166.51294, "r_y2": 373.51596, "r_x3": 161.90601, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 209.509, "t": 373.51596, "r": 214.11594, "b": 381.58572, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 381.58572, "r_x1": 214.11594, "r_y1": 381.58572, "r_x2": 214.11594, "r_y2": 373.51596, "r_x3": 209.509, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 246.71000999999998, "t": 368.03595, "r": 271.40527, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 376.10571, "r_x1": 271.40527, "r_y1": 376.10571, "r_x2": 271.40527, "r_y2": 368.03595, "r_x3": 246.71000999999998, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 289.017, "t": 368.03595, "r": 310.00375, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 376.10571, "r_x1": 310.00375, "r_y1": 376.10571, "r_x2": 310.00375, "r_y2": 368.03595, "r_x3": 289.017, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 326.71701, "t": 368.03595, "r": 347.70377, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 376.10571, "r_x1": 347.70377, "r_y1": 376.10571, "r_x2": 347.70377, "r_y2": 368.03595, "r_x3": 326.71701, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 363.67599, "t": 368.03595, "r": 384.66275, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 376.10571, "r_x1": 384.66275, "r_y1": 376.10571, "r_x2": 384.66275, "r_y2": 368.03595, "r_x3": 363.67599, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 397.26999, "t": 367.97317999999996, "r": 416.12723, "b": 375.89948, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.26999, "r_y0": 375.89948, "r_x1": 416.12723, "r_y1": 375.89948, "r_x2": 416.12723, "r_y2": 367.97317999999996, "r_x3": 397.26999, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 439.52701, "t": 367.97317999999996, "r": 458.38425, "b": 375.89948, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 375.89948, "r_x1": 458.38425, "r_y1": 375.89948, "r_x2": 458.38425, "r_y2": 367.97317999999996, "r_x3": 439.52701, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 245.17598999999998, "t": 380.98795, "r": 272.93954, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 389.05771, "r_x1": 272.93954, "r_y1": 389.05771, "r_x2": 272.93954, "r_y2": 380.98795, "r_x3": 245.17598999999998, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 289.017, "t": 380.98795, "r": 310.00375, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 389.05771, "r_x1": 310.00375, "r_y1": 389.05771, "r_x2": 310.00375, "r_y2": 380.98795, "r_x3": 289.017, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 326.71701, "t": 380.98795, "r": 347.70377, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 389.05771, "r_x1": 347.70377, "r_y1": 389.05771, "r_x2": 347.70377, "r_y2": 380.98795, "r_x3": 326.71701, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 363.67599, "t": 380.98795, "r": 384.66275, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 389.05771, "r_x1": 384.66275, "r_y1": 389.05771, "r_x2": 384.66275, "r_y2": 380.98795, "r_x3": 363.67599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.20599, "t": 380.98795, "r": 417.19275, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 389.05771, "r_x1": 417.19275, "r_y1": 389.05771, "r_x2": 417.19275, "r_y2": 380.98795, "r_x3": 396.20599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 440.767, "t": 380.98795, "r": 457.14682, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 389.05771, "r_x1": 457.14682, "r_y1": 389.05771, "r_x2": 457.14682, "r_y2": 380.98795, "r_x3": 440.767, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 161.90601, "t": 399.81696, "r": 166.51294, "b": 407.88672, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 407.88672, "r_x1": 166.51294, "r_y1": 407.88672, "r_x2": 166.51294, "r_y2": 399.81696, "r_x3": 161.90601, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 209.509, "t": 399.81696, "r": 214.11594, "b": 407.88672, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 407.88672, "r_x1": 214.11594, "r_y1": 407.88672, "r_x2": 214.11594, "r_y2": 399.81696, "r_x3": 209.509, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 246.71000999999998, "t": 394.33795, "r": 271.40527, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 402.40771, "r_x1": 271.40527, "r_y1": 402.40771, "r_x2": 271.40527, "r_y2": 394.33795, "r_x3": 246.71000999999998, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 289.017, "t": 394.33795, "r": 310.00375, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 402.40771, "r_x1": 310.00375, "r_y1": 402.40771, "r_x2": 310.00375, "r_y2": 394.33795, "r_x3": 289.017, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 326.71701, "t": 394.33795, "r": 347.70377, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 402.40771, "r_x1": 347.70377, "r_y1": 402.40771, "r_x2": 347.70377, "r_y2": 394.33795, "r_x3": 326.71701, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 363.67599, "t": 394.33795, "r": 384.66275, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 402.40771, "r_x1": 384.66275, "r_y1": 402.40771, "r_x2": 384.66275, "r_y2": 394.33795, "r_x3": 363.67599, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 394.61801, "t": 394.27518, "r": 418.77887, "b": 402.20148, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 402.20148, "r_x1": 418.77887, "r_y1": 402.20148, "r_x2": 418.77887, "r_y2": 394.27518, "r_x3": 394.61801, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 439.52701, "t": 394.27518, "r": 458.38425, "b": 402.20148, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 402.20148, "r_x1": 458.38425, "r_y1": 402.20148, "r_x2": 458.38425, "r_y2": 394.27518, "r_x3": 439.52701, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 245.17598999999998, "t": 407.28894, "r": 272.93954, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 415.3587, "r_x1": 272.93954, "r_y1": 415.3587, "r_x2": 272.93954, "r_y2": 407.28894, "r_x3": 245.17598999999998, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 289.017, "t": 407.28894, "r": 310.00375, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 415.3587, "r_x1": 310.00375, "r_y1": 415.3587, "r_x2": 310.00375, "r_y2": 407.28894, "r_x3": 289.017, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 326.71701, "t": 407.28894, "r": 347.70377, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 415.3587, "r_x1": 347.70377, "r_y1": 415.3587, "r_x2": 347.70377, "r_y2": 407.28894, "r_x3": 326.71701, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 362.08801, "t": 407.22617, "r": 386.24887, "b": 415.15247, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 415.15247, "r_x1": 386.24887, "r_y1": 415.15247, "r_x2": 386.24887, "r_y2": 407.22617, "r_x3": 362.08801, "r_y3": 407.22617, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 396.20599, "t": 407.28894, "r": 417.19275, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 415.3587, "r_x1": 417.19275, "r_y1": 415.3587, "r_x2": 417.19275, "r_y2": 407.28894, "r_x3": 396.20599, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 440.767, "t": 407.28894, "r": 457.14682, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 415.3587, "r_x1": 457.14682, "r_y1": 415.3587, "r_x2": 457.14682, "r_y2": 407.28894, "r_x3": 440.767, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 161.90601, "t": 426.11795, "r": 166.51294, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 434.1877099999999, "r_x1": 166.51294, "r_y1": 434.1877099999999, "r_x2": 166.51294, "r_y2": 426.11795, "r_x3": 161.90601, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 209.509, "t": 426.11795, "r": 214.11594, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 434.1877099999999, "r_x1": 214.11594, "r_y1": 434.1877099999999, "r_x2": 214.11594, "r_y2": 426.11795, "r_x3": 209.509, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 246.71000999999998, "t": 420.63895, "r": 271.40527, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 428.70871, "r_x1": 271.40527, "r_y1": 428.70871, "r_x2": 271.40527, "r_y2": 420.63895, "r_x3": 246.71000999999998, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 289.017, "t": 420.63895, "r": 310.00375, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 428.70871, "r_x1": 310.00375, "r_y1": 428.70871, "r_x2": 310.00375, "r_y2": 420.63895, "r_x3": 289.017, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.71701, "t": 420.63895, "r": 347.70377, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 428.70871, "r_x1": 347.70377, "r_y1": 428.70871, "r_x2": 347.70377, "r_y2": 420.63895, "r_x3": 326.71701, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 363.67599, "t": 420.63895, "r": 384.66275, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 428.70871, "r_x1": 384.66275, "r_y1": 428.70871, "r_x2": 384.66275, "r_y2": 420.63895, "r_x3": 363.67599, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 394.61801, "t": 420.57617, "r": 418.77887, "b": 428.50247, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 428.50247, "r_x1": 418.77887, "r_y1": 428.50247, "r_x2": 418.77887, "r_y2": 420.57617, "r_x3": 394.61801, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 439.52701, "t": 420.57617, "r": 458.38425, "b": 428.50247, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 428.50247, "r_x1": 458.38425, "r_y1": 428.50247, "r_x2": 458.38425, "r_y2": 420.57617, "r_x3": 439.52701, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 245.17598999999998, "t": 433.58994, "r": 272.93954, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 441.6597, "r_x1": 272.93954, "r_y1": 441.6597, "r_x2": 272.93954, "r_y2": 433.58994, "r_x3": 245.17598999999998, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 289.017, "t": 433.58994, "r": 310.00375, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 441.6597, "r_x1": 310.00375, "r_y1": 441.6597, "r_x2": 310.00375, "r_y2": 433.58994, "r_x3": 289.017, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 326.71701, "t": 433.58994, "r": 347.70377, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 441.6597, "r_x1": 347.70377, "r_y1": 441.6597, "r_x2": 347.70377, "r_y2": 433.58994, "r_x3": 326.71701, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 362.08801, "t": 433.5271599999999, "r": 386.24887, "b": 441.45346, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 441.45346, "r_x1": 386.24887, "r_y1": 441.45346, "r_x2": 386.24887, "r_y2": 433.5271599999999, "r_x3": 362.08801, "r_y3": 433.5271599999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 396.20599, "t": 433.58994, "r": 417.19275, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 441.6597, "r_x1": 417.19275, "r_y1": 441.6597, "r_x2": 417.19275, "r_y2": 433.58994, "r_x3": 396.20599, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 440.767, "t": 433.58994, "r": 457.14682, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 441.6597, "r_x1": 457.14682, "r_y1": 441.6597, "r_x2": 457.14682, "r_y2": 433.58994, "r_x3": 440.767, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 161.90601, "t": 452.41995, "r": 166.51294, "b": 460.48972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 460.48972, "r_x1": 166.51294, "r_y1": 460.48972, "r_x2": 166.51294, "r_y2": 452.41995, "r_x3": 161.90601, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 209.509, "t": 452.41995, "r": 214.11594, "b": 460.48972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 460.48972, "r_x1": 214.11594, "r_y1": 460.48972, "r_x2": 214.11594, "r_y2": 452.41995, "r_x3": 209.509, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 246.71000999999998, "t": 446.9399399999999, "r": 271.40527, "b": 455.0097, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 455.0097, "r_x1": 271.40527, "r_y1": 455.0097, "r_x2": 271.40527, "r_y2": 446.9399399999999, "r_x3": 246.71000999999998, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 289.017, "t": 446.9399399999999, "r": 310.00375, "b": 455.0097, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 455.0097, "r_x1": 310.00375, "r_y1": 455.0097, "r_x2": 310.00375, "r_y2": 446.9399399999999, "r_x3": 289.017, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 329.021, "t": 446.9399399999999, "r": 345.40082, "b": 455.0097, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.021, "r_y0": 455.0097, "r_x1": 345.40082, "r_y1": 455.0097, "r_x2": 345.40082, "r_y2": 446.9399399999999, "r_x3": 329.021, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 362.08801, "t": 446.87717, "r": 386.24887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 454.80347, "r_x1": 386.24887, "r_y1": 454.80347, "r_x2": 386.24887, "r_y2": 446.87717, "r_x3": 362.08801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.61801, "t": 446.87717, "r": 418.77887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 454.80347, "r_x1": 418.77887, "r_y1": 454.80347, "r_x2": 418.77887, "r_y2": 446.87717, "r_x3": 394.61801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 439.52701, "t": 446.87717, "r": 458.38425, "b": 454.80347, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 454.80347, "r_x1": 458.38425, "r_y1": 454.80347, "r_x2": 458.38425, "r_y2": 446.87717, "r_x3": 439.52701, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 245.17598999999998, "t": 459.8919399999999, "r": 272.93954, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 467.9617, "r_x1": 272.93954, "r_y1": 467.9617, "r_x2": 272.93954, "r_y2": 459.8919399999999, "r_x3": 245.17598999999998, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.017, "t": 459.8919399999999, "r": 310.00375, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 467.9617, "r_x1": 310.00375, "r_y1": 467.9617, "r_x2": 310.00375, "r_y2": 459.8919399999999, "r_x3": 289.017, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 326.71701, "t": 459.8919399999999, "r": 347.70377, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 467.9617, "r_x1": 347.70377, "r_y1": 467.9617, "r_x2": 347.70377, "r_y2": 459.8919399999999, "r_x3": 326.71701, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 363.67599, "t": 459.8919399999999, "r": 384.66275, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 467.9617, "r_x1": 384.66275, "r_y1": 467.9617, "r_x2": 384.66275, "r_y2": 459.8919399999999, "r_x3": 363.67599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 396.20599, "t": 459.8919399999999, "r": 417.19275, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 467.9617, "r_x1": 417.19275, "r_y1": 467.9617, "r_x2": 417.19275, "r_y2": 459.8919399999999, "r_x3": 396.20599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 446.65302, "t": 459.8919399999999, "r": 451.25995, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65302, "r_y0": 467.9617, "r_x1": 451.25995, "r_y1": 467.9617, "r_x2": 451.25995, "r_y2": 459.8919399999999, "r_x3": 446.65302, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 6, "num_cols": 8, "table_cells": [ { "bbox": { "l": 160.37, "t": 341.73495, "r": 168.04793, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "# enc-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 207.974, "t": 341.73495, "r": 215.65193, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "# dec-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 239.79799999999997, "t": 347.21396, "r": 278.31766, "b": 355.28372, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 324.67001, "t": 341.73495, "r": 348.26419, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 6, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 396.271, "t": 341.73495, "r": 417.12683, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 394.927, "t": 352.69394000000005, "r": 418.47278, "b": 360.7637, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 430.771, "t": 341.73495, "r": 467.1423, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "Inference", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.14801, "t": 352.69394000000005, "r": 470.76056, "b": 360.7637, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 286.686, "t": 354.68594, "r": 312.33261, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 320.702, "t": 354.68594, "r": 353.71988, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 369.306, "t": 354.68594, "r": 379.03094, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 161.90601, "t": 373.51596, "r": 166.51294, "b": 381.58572, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.509, "t": 373.51596, "r": 214.11594, "b": 381.58572, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71000999999998, "t": 368.03595, "r": 271.40527, "b": 376.10571, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.017, "t": 368.03595, "r": 310.00375, "b": 376.10571, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.71701, "t": 368.03595, "r": 347.70377, "b": 376.10571, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.67599, "t": 368.03595, "r": 384.66275, "b": 376.10571, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 397.26999, "t": 367.97317999999996, "r": 416.12723, "b": 375.89948, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.52701, "t": 367.97317999999996, "r": 458.38425, "b": 375.89948, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.90601, "t": 399.81696, "r": 166.51294, "b": 407.88672, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.509, "t": 399.81696, "r": 214.11594, "b": 407.88672, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71000999999998, "t": 394.33795, "r": 271.40527, "b": 402.40771, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.017, "t": 394.33795, "r": 310.00375, "b": 402.40771, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.938 0.952", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.71701, "t": 394.33795, "r": 347.70377, "b": 402.40771, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.904 0.909", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.67599, "t": 394.33795, "r": 384.66275, "b": 402.40771, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.927 0.938", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.61801, "t": 394.27518, "r": 418.77887, "b": 402.20148, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.853 0.843", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.52701, "t": 394.27518, "r": 458.38425, "b": 402.20148, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.97 3.77", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.90601, "t": 426.11795, "r": 166.51294, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.509, "t": 426.11795, "r": 214.11594, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71000999999998, "t": 420.63895, "r": 271.40527, "b": 428.70871, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.017, "t": 420.63895, "r": 310.00375, "b": 428.70871, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.923 0.945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.71701, "t": 420.63895, "r": 347.70377, "b": 428.70871, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.897 0.901", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.67599, "t": 420.63895, "r": 384.66275, "b": 428.70871, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.915 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.61801, "t": 420.57617, "r": 418.77887, "b": 428.50247, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.859 0.834", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.52701, "t": 420.57617, "r": 458.38425, "b": 428.50247, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.91 3.81", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.90601, "t": 452.41995, "r": 166.51294, "b": 460.48972, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.509, "t": 452.41995, "r": 214.11594, "b": 460.48972, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71000999999998, "t": 446.9399399999999, "r": 271.40527, "b": 455.0097, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.017, "t": 446.9399399999999, "r": 310.00375, "b": 455.0097, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.952 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 329.021, "t": 446.9399399999999, "r": 345.40082, "b": 455.0097, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.92 0.903", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 362.08801, "t": 446.87717, "r": 386.24887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.942 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.61801, "t": 446.87717, "r": 418.77887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.857 0.824", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.52701, "t": 446.87717, "r": 458.38425, "b": 454.80347, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.22 2", "column_header": false, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 8, "page_no": 8, "cluster": { "id": 8, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9373378753662109, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 9, "page_no": 8, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 475.98431, "t": 93.77099999999996, "r": 480.59125000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8857625722885132, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9" }, { "label": "text", "id": 4, "page_no": 8, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.59579, "b": 151.64178000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9805440306663513, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.5936899999999, "r_y1": 127.73077, "r_x2": 480.5936899999999, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 480.59579, "r_y1": 139.68579, "r_x2": 480.59579, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 151.64178000000004, "r_x1": 210.78462, "r_y1": 151.64178000000004, "r_x2": 210.78462, "r_y2": 142.84479, "r_x3": 134.765, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "order to compute the TED score. Inference timing results for all experiments were obtained from the same machine on a single core with AMD EPYC 7763 CPU @2.45 GHz." }, { "label": "section_header", "id": 6, "page_no": 8, "cluster": { "id": 6, "label": "section_header", "bbox": { "l": 134.765, "t": 169.18584999999996, "r": 318.44843, "b": 177.9928, "coord_origin": "TOPLEFT" }, "confidence": 0.9579681158065796, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 177.9928, "r_x1": 149.40205, "r_y1": 177.9928, "r_x2": 149.40205, "r_y2": 169.18584999999996, "r_x3": 134.765, "r_y3": 169.18584999999996, "coord_origin": "TOPLEFT" }, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 177.9928, "r_x1": 318.44843, "r_y1": 177.9928, "r_x2": 318.44843, "r_y2": 169.18584999999996, "r_x3": 160.85904, "r_y3": 169.18584999999996, "coord_origin": "TOPLEFT" }, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.1 Hyper Parameter Optimization" }, { "label": "text", "id": 3, "page_no": 8, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.76498, "t": 185.58582, "r": 480.59277, "b": 254.15886999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.9842326641082764, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 194.38280999999995, "r_x1": 480.59183, "r_y1": 194.38280999999995, "r_x2": 480.59183, "r_y2": 185.58582, "r_x3": 134.765, "r_y3": 185.58582, "coord_origin": "TOPLEFT" }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 206.33783000000005, "r_x1": 480.59183, "r_y1": 206.33783000000005, "r_x2": 480.59183, "r_y2": 197.54083000000003, "r_x3": 134.765, "r_y3": 197.54083000000003, "coord_origin": "TOPLEFT" }, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 218.29285000000004, "r_x1": 480.59177000000005, "r_y1": 218.29285000000004, "r_x2": 480.59177000000005, "r_y2": 209.49585000000002, "r_x3": 134.765, "r_y3": 209.49585000000002, "coord_origin": "TOPLEFT" }, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 230.24785999999995, "r_x1": 480.59277, "r_y1": 230.24785999999995, "r_x2": 480.59277, "r_y2": 221.45087, "r_x3": 134.765, "r_y3": 221.45087, "coord_origin": "TOPLEFT" }, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 242.20288000000005, "r_x1": 440.94159, "r_y1": 242.20288000000005, "r_x2": 440.94159, "r_y2": 233.40588000000002, "r_x3": 134.765, "r_y3": 233.40588000000002, "coord_origin": "TOPLEFT" }, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.86798, "r_y0": 242.20288000000005, "r_x1": 480.58786000000003, "r_y1": 242.20288000000005, "r_x2": 480.58786000000003, "r_y2": 233.40588000000002, "r_x3": 444.86798, "r_y3": 233.40588000000002, "coord_origin": "TOPLEFT" }, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 254.15886999999998, "r_x1": 145.20081, "r_y1": 254.15886999999998, "r_x2": 145.20081, "r_y2": 245.36188000000004, "r_x3": 134.76498, "r_y3": 245.36188000000004, "coord_origin": "TOPLEFT" }, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.14899, "r_y0": 254.15886999999998, "r_x1": 311.21957, "r_y1": 254.15886999999998, "r_x2": 311.21957, "r_y2": 245.36188000000004, "r_x3": 149.14899, "r_y3": 245.36188000000004, "coord_origin": "TOPLEFT" }, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a highly diverse set of tables. Also we report TED scores separately for simple and complex tables (tables with cell spans). Results are presented in Table. 1. It is evident that with OTSL, our model achieves the same TED score and slightly better mAP scores in comparison to HTML. However OTSL yields a 2x speed up in the inference runtime over HTML." }, { "label": "caption", "id": 7, "page_no": 8, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 134.76498, "t": 275.07232999999997, "r": 480.5954, "b": 327.0408, "coord_origin": "TOPLEFT" }, "confidence": 0.9570781588554382, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 282.9986, "r_x1": 160.11836, "r_y1": 282.9986, "r_x2": 160.11836, "r_y2": 275.07232999999997, "r_x3": 134.76498, "r_y3": 275.07232999999997, "coord_origin": "TOPLEFT" }, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.34528, "r_y0": 282.9986, "r_x1": 175.59526, "r_y1": 282.9986, "r_x2": 175.59526, "r_y2": 275.07232999999997, "r_x3": 167.34528, "r_y3": 275.07232999999997, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.13298, "r_y0": 283.2048300000001, "r_x1": 480.59365999999994, "r_y1": 283.2048300000001, "r_x2": 480.59365999999994, "r_y2": 275.13507000000004, "r_x3": 188.13298, "r_y3": 275.13507000000004, "coord_origin": "TOPLEFT" }, "text": "HPO performed in OTSL and HTML representation on the same", "orig": "HPO performed in OTSL and HTML representation on the same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 294.16385, "r_x1": 480.59444999999994, "r_y1": 294.16385, "r_x2": 480.59444999999994, "r_y2": 286.09409, "r_x3": 134.76498, "r_y3": 286.09409, "coord_origin": "TOPLEFT" }, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 305.12283, "r_x1": 480.5954, "r_y1": 305.12283, "r_x2": 480.5954, "r_y2": 297.05307, "r_x3": 134.76498, "r_y3": 297.05307, "coord_origin": "TOPLEFT" }, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 316.08182, "r_x1": 480.59451, "r_y1": 316.08182, "r_x2": 480.59451, "r_y2": 308.01205, "r_x3": 134.76498, "r_y3": 308.01205, "coord_origin": "TOPLEFT" }, "text": "smaller models trained on OTSL perform better, especially in recognizing complex", "orig": "smaller models trained on OTSL perform better, especially in recognizing complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 327.0408, "r_x1": 480.59441999999996, "r_y1": 327.0408, "r_x2": 480.59441999999996, "r_y2": 318.97104, "r_x3": 134.76498, "r_y3": 318.97104, "coord_origin": "TOPLEFT" }, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 1. HPO performed in OTSL and HTML representation on the same transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Effects of reducing the # of layers in encoder and decoder stages of the model show that smaller models trained on OTSL perform better, especially in recognizing complex table structures, and maintain a much higher mAP score than the HTML counterpart." }, { "label": "table", "id": 0, "page_no": 8, "cluster": { "id": 0, "label": "table", "bbox": { "l": 139.66845703125, "t": 337.5747985839844, "r": 475.00372314453125, "b": 469.4721374511719, "coord_origin": "TOPLEFT" }, "confidence": 0.9901032447814941, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8047199999999, "r_x1": 168.04793, "r_y1": 349.8047199999999, "r_x2": 168.04793, "r_y2": 341.73495, "r_x3": 160.37, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.592, "r_y0": 362.75570999999997, "r_x1": 183.82806, "r_y1": 362.75570999999997, "r_x2": 183.82806, "r_y2": 354.68594, "r_x3": 144.592, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.974, "r_y0": 349.8047199999999, "r_x1": 215.65193, "r_y1": 349.8047199999999, "r_x2": 215.65193, "r_y2": 341.73495, "r_x3": 207.974, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19499, "r_y0": 362.75570999999997, "r_x1": 231.43106, "r_y1": 362.75570999999997, "r_x2": 231.43106, "r_y2": 354.68594, "r_x3": 192.19499, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.79799999999997, "r_y0": 355.28372, "r_x1": 278.31766, "r_y1": 355.28372, "r_x2": 278.31766, "r_y2": 347.21396, "r_x3": 239.79799999999997, "r_y3": 347.21396, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67001, "r_y0": 349.8047199999999, "r_x1": 348.26419, "r_y1": 349.8047199999999, "r_x2": 348.26419, "r_y2": 341.73495, "r_x3": 324.67001, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.271, "r_y0": 349.8047199999999, "r_x1": 417.12683, "r_y1": 349.8047199999999, "r_x2": 417.12683, "r_y2": 341.73495, "r_x3": 396.271, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.927, "r_y0": 360.7637, "r_x1": 418.47278, "r_y1": 360.7637, "r_x2": 418.47278, "r_y2": 352.69394000000005, "r_x3": 394.927, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.771, "r_y0": 349.8047199999999, "r_x1": 467.1423, "r_y1": 349.8047199999999, "r_x2": 467.1423, "r_y2": 341.73495, "r_x3": 430.771, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.14801, "r_y0": 360.7637, "r_x1": 470.76056, "r_y1": 360.7637, "r_x2": 470.76056, "r_y2": 352.69394000000005, "r_x3": 427.14801, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.686, "r_y0": 362.75570999999997, "r_x1": 312.33261, "r_y1": 362.75570999999997, "r_x2": 312.33261, "r_y2": 354.68594, "r_x3": 286.686, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.702, "r_y0": 362.75570999999997, "r_x1": 353.71988, "r_y1": 362.75570999999997, "r_x2": 353.71988, "r_y2": 354.68594, "r_x3": 320.702, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.306, "r_y0": 362.75570999999997, "r_x1": 379.03094, "r_y1": 362.75570999999997, "r_x2": 379.03094, "r_y2": 354.68594, "r_x3": 369.306, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 381.58572, "r_x1": 166.51294, "r_y1": 381.58572, "r_x2": 166.51294, "r_y2": 373.51596, "r_x3": 161.90601, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 381.58572, "r_x1": 214.11594, "r_y1": 381.58572, "r_x2": 214.11594, "r_y2": 373.51596, "r_x3": 209.509, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 376.10571, "r_x1": 271.40527, "r_y1": 376.10571, "r_x2": 271.40527, "r_y2": 368.03595, "r_x3": 246.71000999999998, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 376.10571, "r_x1": 310.00375, "r_y1": 376.10571, "r_x2": 310.00375, "r_y2": 368.03595, "r_x3": 289.017, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 376.10571, "r_x1": 347.70377, "r_y1": 376.10571, "r_x2": 347.70377, "r_y2": 368.03595, "r_x3": 326.71701, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 376.10571, "r_x1": 384.66275, "r_y1": 376.10571, "r_x2": 384.66275, "r_y2": 368.03595, "r_x3": 363.67599, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.26999, "r_y0": 375.89948, "r_x1": 416.12723, "r_y1": 375.89948, "r_x2": 416.12723, "r_y2": 367.97317999999996, "r_x3": 397.26999, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 375.89948, "r_x1": 458.38425, "r_y1": 375.89948, "r_x2": 458.38425, "r_y2": 367.97317999999996, "r_x3": 439.52701, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 389.05771, "r_x1": 272.93954, "r_y1": 389.05771, "r_x2": 272.93954, "r_y2": 380.98795, "r_x3": 245.17598999999998, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 389.05771, "r_x1": 310.00375, "r_y1": 389.05771, "r_x2": 310.00375, "r_y2": 380.98795, "r_x3": 289.017, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 389.05771, "r_x1": 347.70377, "r_y1": 389.05771, "r_x2": 347.70377, "r_y2": 380.98795, "r_x3": 326.71701, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 389.05771, "r_x1": 384.66275, "r_y1": 389.05771, "r_x2": 384.66275, "r_y2": 380.98795, "r_x3": 363.67599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 389.05771, "r_x1": 417.19275, "r_y1": 389.05771, "r_x2": 417.19275, "r_y2": 380.98795, "r_x3": 396.20599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 389.05771, "r_x1": 457.14682, "r_y1": 389.05771, "r_x2": 457.14682, "r_y2": 380.98795, "r_x3": 440.767, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 407.88672, "r_x1": 166.51294, "r_y1": 407.88672, "r_x2": 166.51294, "r_y2": 399.81696, "r_x3": 161.90601, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 407.88672, "r_x1": 214.11594, "r_y1": 407.88672, "r_x2": 214.11594, "r_y2": 399.81696, "r_x3": 209.509, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 402.40771, "r_x1": 271.40527, "r_y1": 402.40771, "r_x2": 271.40527, "r_y2": 394.33795, "r_x3": 246.71000999999998, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 402.40771, "r_x1": 310.00375, "r_y1": 402.40771, "r_x2": 310.00375, "r_y2": 394.33795, "r_x3": 289.017, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 402.40771, "r_x1": 347.70377, "r_y1": 402.40771, "r_x2": 347.70377, "r_y2": 394.33795, "r_x3": 326.71701, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 402.40771, "r_x1": 384.66275, "r_y1": 402.40771, "r_x2": 384.66275, "r_y2": 394.33795, "r_x3": 363.67599, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 402.20148, "r_x1": 418.77887, "r_y1": 402.20148, "r_x2": 418.77887, "r_y2": 394.27518, "r_x3": 394.61801, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 402.20148, "r_x1": 458.38425, "r_y1": 402.20148, "r_x2": 458.38425, "r_y2": 394.27518, "r_x3": 439.52701, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 415.3587, "r_x1": 272.93954, "r_y1": 415.3587, "r_x2": 272.93954, "r_y2": 407.28894, "r_x3": 245.17598999999998, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 415.3587, "r_x1": 310.00375, "r_y1": 415.3587, "r_x2": 310.00375, "r_y2": 407.28894, "r_x3": 289.017, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 415.3587, "r_x1": 347.70377, "r_y1": 415.3587, "r_x2": 347.70377, "r_y2": 407.28894, "r_x3": 326.71701, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 415.15247, "r_x1": 386.24887, "r_y1": 415.15247, "r_x2": 386.24887, "r_y2": 407.22617, "r_x3": 362.08801, "r_y3": 407.22617, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 415.3587, "r_x1": 417.19275, "r_y1": 415.3587, "r_x2": 417.19275, "r_y2": 407.28894, "r_x3": 396.20599, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 415.3587, "r_x1": 457.14682, "r_y1": 415.3587, "r_x2": 457.14682, "r_y2": 407.28894, "r_x3": 440.767, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 434.1877099999999, "r_x1": 166.51294, "r_y1": 434.1877099999999, "r_x2": 166.51294, "r_y2": 426.11795, "r_x3": 161.90601, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 434.1877099999999, "r_x1": 214.11594, "r_y1": 434.1877099999999, "r_x2": 214.11594, "r_y2": 426.11795, "r_x3": 209.509, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 428.70871, "r_x1": 271.40527, "r_y1": 428.70871, "r_x2": 271.40527, "r_y2": 420.63895, "r_x3": 246.71000999999998, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 428.70871, "r_x1": 310.00375, "r_y1": 428.70871, "r_x2": 310.00375, "r_y2": 420.63895, "r_x3": 289.017, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 428.70871, "r_x1": 347.70377, "r_y1": 428.70871, "r_x2": 347.70377, "r_y2": 420.63895, "r_x3": 326.71701, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 428.70871, "r_x1": 384.66275, "r_y1": 428.70871, "r_x2": 384.66275, "r_y2": 420.63895, "r_x3": 363.67599, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 428.50247, "r_x1": 418.77887, "r_y1": 428.50247, "r_x2": 418.77887, "r_y2": 420.57617, "r_x3": 394.61801, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 428.50247, "r_x1": 458.38425, "r_y1": 428.50247, "r_x2": 458.38425, "r_y2": 420.57617, "r_x3": 439.52701, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 441.6597, "r_x1": 272.93954, "r_y1": 441.6597, "r_x2": 272.93954, "r_y2": 433.58994, "r_x3": 245.17598999999998, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 441.6597, "r_x1": 310.00375, "r_y1": 441.6597, "r_x2": 310.00375, "r_y2": 433.58994, "r_x3": 289.017, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 441.6597, "r_x1": 347.70377, "r_y1": 441.6597, "r_x2": 347.70377, "r_y2": 433.58994, "r_x3": 326.71701, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 441.45346, "r_x1": 386.24887, "r_y1": 441.45346, "r_x2": 386.24887, "r_y2": 433.5271599999999, "r_x3": 362.08801, "r_y3": 433.5271599999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 441.6597, "r_x1": 417.19275, "r_y1": 441.6597, "r_x2": 417.19275, "r_y2": 433.58994, "r_x3": 396.20599, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 441.6597, "r_x1": 457.14682, "r_y1": 441.6597, "r_x2": 457.14682, "r_y2": 433.58994, "r_x3": 440.767, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 460.48972, "r_x1": 166.51294, "r_y1": 460.48972, "r_x2": 166.51294, "r_y2": 452.41995, "r_x3": 161.90601, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 460.48972, "r_x1": 214.11594, "r_y1": 460.48972, "r_x2": 214.11594, "r_y2": 452.41995, "r_x3": 209.509, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 455.0097, "r_x1": 271.40527, "r_y1": 455.0097, "r_x2": 271.40527, "r_y2": 446.9399399999999, "r_x3": 246.71000999999998, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 455.0097, "r_x1": 310.00375, "r_y1": 455.0097, "r_x2": 310.00375, "r_y2": 446.9399399999999, "r_x3": 289.017, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.021, "r_y0": 455.0097, "r_x1": 345.40082, "r_y1": 455.0097, "r_x2": 345.40082, "r_y2": 446.9399399999999, "r_x3": 329.021, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 454.80347, "r_x1": 386.24887, "r_y1": 454.80347, "r_x2": 386.24887, "r_y2": 446.87717, "r_x3": 362.08801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 454.80347, "r_x1": 418.77887, "r_y1": 454.80347, "r_x2": 418.77887, "r_y2": 446.87717, "r_x3": 394.61801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 454.80347, "r_x1": 458.38425, "r_y1": 454.80347, "r_x2": 458.38425, "r_y2": 446.87717, "r_x3": 439.52701, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 467.9617, "r_x1": 272.93954, "r_y1": 467.9617, "r_x2": 272.93954, "r_y2": 459.8919399999999, "r_x3": 245.17598999999998, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 467.9617, "r_x1": 310.00375, "r_y1": 467.9617, "r_x2": 310.00375, "r_y2": 459.8919399999999, "r_x3": 289.017, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 467.9617, "r_x1": 347.70377, "r_y1": 467.9617, "r_x2": 347.70377, "r_y2": 459.8919399999999, "r_x3": 326.71701, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 467.9617, "r_x1": 384.66275, "r_y1": 467.9617, "r_x2": 384.66275, "r_y2": 459.8919399999999, "r_x3": 363.67599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 467.9617, "r_x1": 417.19275, "r_y1": 467.9617, "r_x2": 417.19275, "r_y2": 459.8919399999999, "r_x3": 396.20599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65302, "r_y0": 467.9617, "r_x1": 451.25995, "r_y1": 467.9617, "r_x2": 451.25995, "r_y2": 459.8919399999999, "r_x3": 446.65302, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 160.37, "t": 341.73495, "r": 168.04793, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8047199999999, "r_x1": 168.04793, "r_y1": 349.8047199999999, "r_x2": 168.04793, "r_y2": 341.73495, "r_x3": 160.37, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 144.592, "t": 354.68594, "r": 183.82806, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.592, "r_y0": 362.75570999999997, "r_x1": 183.82806, "r_y1": 362.75570999999997, "r_x2": 183.82806, "r_y2": 354.68594, "r_x3": 144.592, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 207.974, "t": 341.73495, "r": 215.65193, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.974, "r_y0": 349.8047199999999, "r_x1": 215.65193, "r_y1": 349.8047199999999, "r_x2": 215.65193, "r_y2": 341.73495, "r_x3": 207.974, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 192.19499, "t": 354.68594, "r": 231.43106, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19499, "r_y0": 362.75570999999997, "r_x1": 231.43106, "r_y1": 362.75570999999997, "r_x2": 231.43106, "r_y2": 354.68594, "r_x3": 192.19499, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 239.79799999999997, "t": 347.21396, "r": 278.31766, "b": 355.28372, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.79799999999997, "r_y0": 355.28372, "r_x1": 278.31766, "r_y1": 355.28372, "r_x2": 278.31766, "r_y2": 347.21396, "r_x3": 239.79799999999997, "r_y3": 347.21396, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 324.67001, "t": 341.73495, "r": 348.26419, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67001, "r_y0": 349.8047199999999, "r_x1": 348.26419, "r_y1": 349.8047199999999, "r_x2": 348.26419, "r_y2": 341.73495, "r_x3": 324.67001, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 396.271, "t": 341.73495, "r": 417.12683, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.271, "r_y0": 349.8047199999999, "r_x1": 417.12683, "r_y1": 349.8047199999999, "r_x2": 417.12683, "r_y2": 341.73495, "r_x3": 396.271, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 394.927, "t": 352.69394000000005, "r": 418.47278, "b": 360.7637, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.927, "r_y0": 360.7637, "r_x1": 418.47278, "r_y1": 360.7637, "r_x2": 418.47278, "r_y2": 352.69394000000005, "r_x3": 394.927, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 430.771, "t": 341.73495, "r": 467.1423, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.771, "r_y0": 349.8047199999999, "r_x1": 467.1423, "r_y1": 349.8047199999999, "r_x2": 467.1423, "r_y2": 341.73495, "r_x3": 430.771, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 427.14801, "t": 352.69394000000005, "r": 470.76056, "b": 360.7637, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.14801, "r_y0": 360.7637, "r_x1": 470.76056, "r_y1": 360.7637, "r_x2": 470.76056, "r_y2": 352.69394000000005, "r_x3": 427.14801, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 286.686, "t": 354.68594, "r": 312.33261, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.686, "r_y0": 362.75570999999997, "r_x1": 312.33261, "r_y1": 362.75570999999997, "r_x2": 312.33261, "r_y2": 354.68594, "r_x3": 286.686, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 320.702, "t": 354.68594, "r": 353.71988, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.702, "r_y0": 362.75570999999997, "r_x1": 353.71988, "r_y1": 362.75570999999997, "r_x2": 353.71988, "r_y2": 354.68594, "r_x3": 320.702, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 369.306, "t": 354.68594, "r": 379.03094, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.306, "r_y0": 362.75570999999997, "r_x1": 379.03094, "r_y1": 362.75570999999997, "r_x2": 379.03094, "r_y2": 354.68594, "r_x3": 369.306, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 161.90601, "t": 373.51596, "r": 166.51294, "b": 381.58572, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 381.58572, "r_x1": 166.51294, "r_y1": 381.58572, "r_x2": 166.51294, "r_y2": 373.51596, "r_x3": 161.90601, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 209.509, "t": 373.51596, "r": 214.11594, "b": 381.58572, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 381.58572, "r_x1": 214.11594, "r_y1": 381.58572, "r_x2": 214.11594, "r_y2": 373.51596, "r_x3": 209.509, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 246.71000999999998, "t": 368.03595, "r": 271.40527, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 376.10571, "r_x1": 271.40527, "r_y1": 376.10571, "r_x2": 271.40527, "r_y2": 368.03595, "r_x3": 246.71000999999998, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 289.017, "t": 368.03595, "r": 310.00375, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 376.10571, "r_x1": 310.00375, "r_y1": 376.10571, "r_x2": 310.00375, "r_y2": 368.03595, "r_x3": 289.017, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 326.71701, "t": 368.03595, "r": 347.70377, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 376.10571, "r_x1": 347.70377, "r_y1": 376.10571, "r_x2": 347.70377, "r_y2": 368.03595, "r_x3": 326.71701, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 363.67599, "t": 368.03595, "r": 384.66275, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 376.10571, "r_x1": 384.66275, "r_y1": 376.10571, "r_x2": 384.66275, "r_y2": 368.03595, "r_x3": 363.67599, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 397.26999, "t": 367.97317999999996, "r": 416.12723, "b": 375.89948, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.26999, "r_y0": 375.89948, "r_x1": 416.12723, "r_y1": 375.89948, "r_x2": 416.12723, "r_y2": 367.97317999999996, "r_x3": 397.26999, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 439.52701, "t": 367.97317999999996, "r": 458.38425, "b": 375.89948, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 375.89948, "r_x1": 458.38425, "r_y1": 375.89948, "r_x2": 458.38425, "r_y2": 367.97317999999996, "r_x3": 439.52701, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 245.17598999999998, "t": 380.98795, "r": 272.93954, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 389.05771, "r_x1": 272.93954, "r_y1": 389.05771, "r_x2": 272.93954, "r_y2": 380.98795, "r_x3": 245.17598999999998, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 289.017, "t": 380.98795, "r": 310.00375, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 389.05771, "r_x1": 310.00375, "r_y1": 389.05771, "r_x2": 310.00375, "r_y2": 380.98795, "r_x3": 289.017, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 326.71701, "t": 380.98795, "r": 347.70377, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 389.05771, "r_x1": 347.70377, "r_y1": 389.05771, "r_x2": 347.70377, "r_y2": 380.98795, "r_x3": 326.71701, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 363.67599, "t": 380.98795, "r": 384.66275, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 389.05771, "r_x1": 384.66275, "r_y1": 389.05771, "r_x2": 384.66275, "r_y2": 380.98795, "r_x3": 363.67599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.20599, "t": 380.98795, "r": 417.19275, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 389.05771, "r_x1": 417.19275, "r_y1": 389.05771, "r_x2": 417.19275, "r_y2": 380.98795, "r_x3": 396.20599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 440.767, "t": 380.98795, "r": 457.14682, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 389.05771, "r_x1": 457.14682, "r_y1": 389.05771, "r_x2": 457.14682, "r_y2": 380.98795, "r_x3": 440.767, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 161.90601, "t": 399.81696, "r": 166.51294, "b": 407.88672, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 407.88672, "r_x1": 166.51294, "r_y1": 407.88672, "r_x2": 166.51294, "r_y2": 399.81696, "r_x3": 161.90601, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 209.509, "t": 399.81696, "r": 214.11594, "b": 407.88672, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 407.88672, "r_x1": 214.11594, "r_y1": 407.88672, "r_x2": 214.11594, "r_y2": 399.81696, "r_x3": 209.509, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 246.71000999999998, "t": 394.33795, "r": 271.40527, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 402.40771, "r_x1": 271.40527, "r_y1": 402.40771, "r_x2": 271.40527, "r_y2": 394.33795, "r_x3": 246.71000999999998, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 289.017, "t": 394.33795, "r": 310.00375, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 402.40771, "r_x1": 310.00375, "r_y1": 402.40771, "r_x2": 310.00375, "r_y2": 394.33795, "r_x3": 289.017, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 326.71701, "t": 394.33795, "r": 347.70377, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 402.40771, "r_x1": 347.70377, "r_y1": 402.40771, "r_x2": 347.70377, "r_y2": 394.33795, "r_x3": 326.71701, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 363.67599, "t": 394.33795, "r": 384.66275, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 402.40771, "r_x1": 384.66275, "r_y1": 402.40771, "r_x2": 384.66275, "r_y2": 394.33795, "r_x3": 363.67599, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 394.61801, "t": 394.27518, "r": 418.77887, "b": 402.20148, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 402.20148, "r_x1": 418.77887, "r_y1": 402.20148, "r_x2": 418.77887, "r_y2": 394.27518, "r_x3": 394.61801, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 439.52701, "t": 394.27518, "r": 458.38425, "b": 402.20148, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 402.20148, "r_x1": 458.38425, "r_y1": 402.20148, "r_x2": 458.38425, "r_y2": 394.27518, "r_x3": 439.52701, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 245.17598999999998, "t": 407.28894, "r": 272.93954, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 415.3587, "r_x1": 272.93954, "r_y1": 415.3587, "r_x2": 272.93954, "r_y2": 407.28894, "r_x3": 245.17598999999998, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 289.017, "t": 407.28894, "r": 310.00375, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 415.3587, "r_x1": 310.00375, "r_y1": 415.3587, "r_x2": 310.00375, "r_y2": 407.28894, "r_x3": 289.017, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 326.71701, "t": 407.28894, "r": 347.70377, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 415.3587, "r_x1": 347.70377, "r_y1": 415.3587, "r_x2": 347.70377, "r_y2": 407.28894, "r_x3": 326.71701, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 362.08801, "t": 407.22617, "r": 386.24887, "b": 415.15247, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 415.15247, "r_x1": 386.24887, "r_y1": 415.15247, "r_x2": 386.24887, "r_y2": 407.22617, "r_x3": 362.08801, "r_y3": 407.22617, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 396.20599, "t": 407.28894, "r": 417.19275, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 415.3587, "r_x1": 417.19275, "r_y1": 415.3587, "r_x2": 417.19275, "r_y2": 407.28894, "r_x3": 396.20599, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 440.767, "t": 407.28894, "r": 457.14682, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 415.3587, "r_x1": 457.14682, "r_y1": 415.3587, "r_x2": 457.14682, "r_y2": 407.28894, "r_x3": 440.767, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 161.90601, "t": 426.11795, "r": 166.51294, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 434.1877099999999, "r_x1": 166.51294, "r_y1": 434.1877099999999, "r_x2": 166.51294, "r_y2": 426.11795, "r_x3": 161.90601, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 209.509, "t": 426.11795, "r": 214.11594, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 434.1877099999999, "r_x1": 214.11594, "r_y1": 434.1877099999999, "r_x2": 214.11594, "r_y2": 426.11795, "r_x3": 209.509, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 246.71000999999998, "t": 420.63895, "r": 271.40527, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 428.70871, "r_x1": 271.40527, "r_y1": 428.70871, "r_x2": 271.40527, "r_y2": 420.63895, "r_x3": 246.71000999999998, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 289.017, "t": 420.63895, "r": 310.00375, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 428.70871, "r_x1": 310.00375, "r_y1": 428.70871, "r_x2": 310.00375, "r_y2": 420.63895, "r_x3": 289.017, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.71701, "t": 420.63895, "r": 347.70377, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 428.70871, "r_x1": 347.70377, "r_y1": 428.70871, "r_x2": 347.70377, "r_y2": 420.63895, "r_x3": 326.71701, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 363.67599, "t": 420.63895, "r": 384.66275, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 428.70871, "r_x1": 384.66275, "r_y1": 428.70871, "r_x2": 384.66275, "r_y2": 420.63895, "r_x3": 363.67599, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 394.61801, "t": 420.57617, "r": 418.77887, "b": 428.50247, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 428.50247, "r_x1": 418.77887, "r_y1": 428.50247, "r_x2": 418.77887, "r_y2": 420.57617, "r_x3": 394.61801, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 439.52701, "t": 420.57617, "r": 458.38425, "b": 428.50247, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 428.50247, "r_x1": 458.38425, "r_y1": 428.50247, "r_x2": 458.38425, "r_y2": 420.57617, "r_x3": 439.52701, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 245.17598999999998, "t": 433.58994, "r": 272.93954, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 441.6597, "r_x1": 272.93954, "r_y1": 441.6597, "r_x2": 272.93954, "r_y2": 433.58994, "r_x3": 245.17598999999998, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 289.017, "t": 433.58994, "r": 310.00375, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 441.6597, "r_x1": 310.00375, "r_y1": 441.6597, "r_x2": 310.00375, "r_y2": 433.58994, "r_x3": 289.017, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 326.71701, "t": 433.58994, "r": 347.70377, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 441.6597, "r_x1": 347.70377, "r_y1": 441.6597, "r_x2": 347.70377, "r_y2": 433.58994, "r_x3": 326.71701, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 362.08801, "t": 433.5271599999999, "r": 386.24887, "b": 441.45346, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 441.45346, "r_x1": 386.24887, "r_y1": 441.45346, "r_x2": 386.24887, "r_y2": 433.5271599999999, "r_x3": 362.08801, "r_y3": 433.5271599999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 396.20599, "t": 433.58994, "r": 417.19275, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 441.6597, "r_x1": 417.19275, "r_y1": 441.6597, "r_x2": 417.19275, "r_y2": 433.58994, "r_x3": 396.20599, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 440.767, "t": 433.58994, "r": 457.14682, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 441.6597, "r_x1": 457.14682, "r_y1": 441.6597, "r_x2": 457.14682, "r_y2": 433.58994, "r_x3": 440.767, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 161.90601, "t": 452.41995, "r": 166.51294, "b": 460.48972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 460.48972, "r_x1": 166.51294, "r_y1": 460.48972, "r_x2": 166.51294, "r_y2": 452.41995, "r_x3": 161.90601, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 209.509, "t": 452.41995, "r": 214.11594, "b": 460.48972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 460.48972, "r_x1": 214.11594, "r_y1": 460.48972, "r_x2": 214.11594, "r_y2": 452.41995, "r_x3": 209.509, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 246.71000999999998, "t": 446.9399399999999, "r": 271.40527, "b": 455.0097, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 455.0097, "r_x1": 271.40527, "r_y1": 455.0097, "r_x2": 271.40527, "r_y2": 446.9399399999999, "r_x3": 246.71000999999998, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 289.017, "t": 446.9399399999999, "r": 310.00375, "b": 455.0097, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 455.0097, "r_x1": 310.00375, "r_y1": 455.0097, "r_x2": 310.00375, "r_y2": 446.9399399999999, "r_x3": 289.017, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 329.021, "t": 446.9399399999999, "r": 345.40082, "b": 455.0097, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.021, "r_y0": 455.0097, "r_x1": 345.40082, "r_y1": 455.0097, "r_x2": 345.40082, "r_y2": 446.9399399999999, "r_x3": 329.021, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 362.08801, "t": 446.87717, "r": 386.24887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 454.80347, "r_x1": 386.24887, "r_y1": 454.80347, "r_x2": 386.24887, "r_y2": 446.87717, "r_x3": 362.08801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.61801, "t": 446.87717, "r": 418.77887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 454.80347, "r_x1": 418.77887, "r_y1": 454.80347, "r_x2": 418.77887, "r_y2": 446.87717, "r_x3": 394.61801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 439.52701, "t": 446.87717, "r": 458.38425, "b": 454.80347, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 454.80347, "r_x1": 458.38425, "r_y1": 454.80347, "r_x2": 458.38425, "r_y2": 446.87717, "r_x3": 439.52701, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 245.17598999999998, "t": 459.8919399999999, "r": 272.93954, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 467.9617, "r_x1": 272.93954, "r_y1": 467.9617, "r_x2": 272.93954, "r_y2": 459.8919399999999, "r_x3": 245.17598999999998, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.017, "t": 459.8919399999999, "r": 310.00375, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 467.9617, "r_x1": 310.00375, "r_y1": 467.9617, "r_x2": 310.00375, "r_y2": 459.8919399999999, "r_x3": 289.017, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 326.71701, "t": 459.8919399999999, "r": 347.70377, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 467.9617, "r_x1": 347.70377, "r_y1": 467.9617, "r_x2": 347.70377, "r_y2": 459.8919399999999, "r_x3": 326.71701, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 363.67599, "t": 459.8919399999999, "r": 384.66275, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 467.9617, "r_x1": 384.66275, "r_y1": 467.9617, "r_x2": 384.66275, "r_y2": 459.8919399999999, "r_x3": 363.67599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 396.20599, "t": 459.8919399999999, "r": 417.19275, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 467.9617, "r_x1": 417.19275, "r_y1": 467.9617, "r_x2": 417.19275, "r_y2": 459.8919399999999, "r_x3": 396.20599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 446.65302, "t": 459.8919399999999, "r": 451.25995, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65302, "r_y0": 467.9617, "r_x1": 451.25995, "r_y1": 467.9617, "r_x2": 451.25995, "r_y2": 459.8919399999999, "r_x3": 446.65302, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 6, "num_cols": 8, "table_cells": [ { "bbox": { "l": 160.37, "t": 341.73495, "r": 168.04793, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "# enc-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 207.974, "t": 341.73495, "r": 215.65193, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "# dec-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 239.79799999999997, "t": 347.21396, "r": 278.31766, "b": 355.28372, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 324.67001, "t": 341.73495, "r": 348.26419, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 6, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 396.271, "t": 341.73495, "r": 417.12683, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 394.927, "t": 352.69394000000005, "r": 418.47278, "b": 360.7637, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 430.771, "t": 341.73495, "r": 467.1423, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "Inference", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.14801, "t": 352.69394000000005, "r": 470.76056, "b": 360.7637, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 286.686, "t": 354.68594, "r": 312.33261, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 320.702, "t": 354.68594, "r": 353.71988, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 369.306, "t": 354.68594, "r": 379.03094, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 161.90601, "t": 373.51596, "r": 166.51294, "b": 381.58572, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.509, "t": 373.51596, "r": 214.11594, "b": 381.58572, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71000999999998, "t": 368.03595, "r": 271.40527, "b": 376.10571, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.017, "t": 368.03595, "r": 310.00375, "b": 376.10571, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.71701, "t": 368.03595, "r": 347.70377, "b": 376.10571, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.67599, "t": 368.03595, "r": 384.66275, "b": 376.10571, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 397.26999, "t": 367.97317999999996, "r": 416.12723, "b": 375.89948, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.52701, "t": 367.97317999999996, "r": 458.38425, "b": 375.89948, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.90601, "t": 399.81696, "r": 166.51294, "b": 407.88672, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.509, "t": 399.81696, "r": 214.11594, "b": 407.88672, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71000999999998, "t": 394.33795, "r": 271.40527, "b": 402.40771, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.017, "t": 394.33795, "r": 310.00375, "b": 402.40771, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.938 0.952", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.71701, "t": 394.33795, "r": 347.70377, "b": 402.40771, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.904 0.909", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.67599, "t": 394.33795, "r": 384.66275, "b": 402.40771, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.927 0.938", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.61801, "t": 394.27518, "r": 418.77887, "b": 402.20148, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.853 0.843", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.52701, "t": 394.27518, "r": 458.38425, "b": 402.20148, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.97 3.77", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.90601, "t": 426.11795, "r": 166.51294, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.509, "t": 426.11795, "r": 214.11594, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71000999999998, "t": 420.63895, "r": 271.40527, "b": 428.70871, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.017, "t": 420.63895, "r": 310.00375, "b": 428.70871, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.923 0.945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.71701, "t": 420.63895, "r": 347.70377, "b": 428.70871, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.897 0.901", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.67599, "t": 420.63895, "r": 384.66275, "b": 428.70871, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.915 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.61801, "t": 420.57617, "r": 418.77887, "b": 428.50247, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.859 0.834", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.52701, "t": 420.57617, "r": 458.38425, "b": 428.50247, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.91 3.81", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.90601, "t": 452.41995, "r": 166.51294, "b": 460.48972, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.509, "t": 452.41995, "r": 214.11594, "b": 460.48972, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71000999999998, "t": 446.9399399999999, "r": 271.40527, "b": 455.0097, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.017, "t": 446.9399399999999, "r": 310.00375, "b": 455.0097, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.952 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 329.021, "t": 446.9399399999999, "r": 345.40082, "b": 455.0097, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.92 0.903", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 362.08801, "t": 446.87717, "r": 386.24887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.942 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.61801, "t": 446.87717, "r": 418.77887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.857 0.824", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.52701, "t": 446.87717, "r": 458.38425, "b": 454.80347, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.22 2", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "section_header", "id": 5, "page_no": 8, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.765, "t": 508.15179, "r": 264.40332, "b": 516.95874, "coord_origin": "TOPLEFT" }, "confidence": 0.9592539668083191, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 516.95874, "r_x1": 149.40205, "r_y1": 516.95874, "r_x2": 149.40205, "r_y2": 508.15179, "r_x3": 134.765, "r_y3": 508.15179, "coord_origin": "TOPLEFT" }, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 516.95874, "r_x1": 264.40332, "r_y1": 516.95874, "r_x2": 264.40332, "r_y2": 508.15179, "r_x3": 160.85904, "r_y3": 508.15179, "coord_origin": "TOPLEFT" }, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.2 Quantitative Results" }, { "label": "text", "id": 1, "page_no": 8, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 524.55078, "r": 480.5957599999999, "b": 617.03474, "coord_origin": "TOPLEFT" }, "confidence": 0.9854757189750671, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 533.34775, "r_x1": 480.59075999999993, "r_y1": 533.34775, "r_x2": 480.59075999999993, "r_y2": 524.55078, "r_x3": 134.765, "r_y3": 524.55078, "coord_origin": "TOPLEFT" }, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 545.3037400000001, "r_x1": 480.58675999999997, "r_y1": 545.3037400000001, "r_x2": 480.58675999999997, "r_y2": 536.50677, "r_x3": 134.765, "r_y3": 536.50677, "coord_origin": "TOPLEFT" }, "text": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 557.25874, "r_x1": 480.59572999999995, "r_y1": 557.25874, "r_x2": 480.59572999999995, "r_y2": 548.4617800000001, "r_x3": 134.765, "r_y3": 548.4617800000001, "coord_origin": "TOPLEFT" }, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 569.21375, "r_x1": 480.59177000000005, "r_y1": 569.21375, "r_x2": 480.59177000000005, "r_y2": 560.41678, "r_x3": 134.765, "r_y3": 560.41678, "coord_origin": "TOPLEFT" }, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 581.16875, "r_x1": 480.59069999999997, "r_y1": 581.16875, "r_x2": 480.59069999999997, "r_y2": 572.37178, "r_x3": 134.765, "r_y3": 572.37178, "coord_origin": "TOPLEFT" }, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 593.12375, "r_x1": 480.5957599999999, "r_y1": 593.12375, "r_x2": 480.5957599999999, "r_y2": 584.32678, "r_x3": 134.765, "r_y3": 584.32678, "coord_origin": "TOPLEFT" }, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 605.07974, "r_x1": 480.58774, "r_y1": 605.07974, "r_x2": 480.58774, "r_y2": 596.28278, "r_x3": 134.765, "r_y3": 596.28278, "coord_origin": "TOPLEFT" }, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 617.03474, "r_x1": 206.78664, "r_y1": 617.03474, "r_x2": 206.78664, "r_y2": 608.2377799999999, "r_x3": 134.765, "r_y3": 608.2377799999999, "coord_origin": "TOPLEFT" }, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We picked the model parameter configuration that produced the best prediction quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently trained and evaluated it on three publicly available data sets: PubTabNet (395k samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples). Performance results are presented in Table. 2. It is clearly evident that the model trained on OTSL outperforms HTML across the board, keeping high TEDs and mAP scores even on difficult financial tables (FinTabNet) that contain sparse and large tables." }, { "label": "text", "id": 2, "page_no": 8, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.765, "t": 620.19278, "r": 480.5957599999999, "b": 664.8547599999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9851234555244446, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 628.98975, "r_x1": 480.59271, "r_y1": 628.98975, "r_x2": 480.59271, "r_y2": 620.19278, "r_x3": 149.709, "r_y3": 620.19278, "coord_origin": "TOPLEFT" }, "text": "Additionally, the results show that OTSL has an advantage over HTML", "orig": "Additionally, the results show that OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 640.94475, "r_x1": 480.5957599999999, "r_y1": 640.94475, "r_x2": 480.5957599999999, "r_y2": 632.14778, "r_x3": 134.765, "r_y3": 632.14778, "coord_origin": "TOPLEFT" }, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 652.89975, "r_x1": 480.59283000000005, "r_y1": 652.89975, "r_x2": 480.59283000000005, "r_y2": 644.1027799999999, "r_x3": 134.765, "r_y3": 644.1027799999999, "coord_origin": "TOPLEFT" }, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 664.8547599999999, "r_x1": 405.79651, "r_y1": 664.8547599999999, "r_x2": 405.79651, "r_y2": 656.0577900000001, "r_x3": 134.765, "r_y3": 656.0577900000001, "coord_origin": "TOPLEFT" }, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Additionally, the results show that OTSL has an advantage over HTML when applied on a bigger data set like PubTables-1M and achieves significantly improved scores. Finally, OTSL achieves faster inference due to fewer decoding steps which is a result of the reduced sequence representation." } ], "body": [ { "label": "text", "id": 4, "page_no": 8, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.765, "t": 118.93377999999996, "r": 480.59579, "b": 151.64178000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9805440306663513, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.73077, "r_x1": 480.5936899999999, "r_y1": 127.73077, "r_x2": 480.5936899999999, "r_y2": 118.93377999999996, "r_x3": 134.765, "r_y3": 118.93377999999996, "coord_origin": "TOPLEFT" }, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 139.68579, "r_x1": 480.59579, "r_y1": 139.68579, "r_x2": 480.59579, "r_y2": 130.88878999999997, "r_x3": 134.765, "r_y3": 130.88878999999997, "coord_origin": "TOPLEFT" }, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 151.64178000000004, "r_x1": 210.78462, "r_y1": 151.64178000000004, "r_x2": 210.78462, "r_y2": 142.84479, "r_x3": 134.765, "r_y3": 142.84479, "coord_origin": "TOPLEFT" }, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "order to compute the TED score. Inference timing results for all experiments were obtained from the same machine on a single core with AMD EPYC 7763 CPU @2.45 GHz." }, { "label": "section_header", "id": 6, "page_no": 8, "cluster": { "id": 6, "label": "section_header", "bbox": { "l": 134.765, "t": 169.18584999999996, "r": 318.44843, "b": 177.9928, "coord_origin": "TOPLEFT" }, "confidence": 0.9579681158065796, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 177.9928, "r_x1": 149.40205, "r_y1": 177.9928, "r_x2": 149.40205, "r_y2": 169.18584999999996, "r_x3": 134.765, "r_y3": 169.18584999999996, "coord_origin": "TOPLEFT" }, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 177.9928, "r_x1": 318.44843, "r_y1": 177.9928, "r_x2": 318.44843, "r_y2": 169.18584999999996, "r_x3": 160.85904, "r_y3": 169.18584999999996, "coord_origin": "TOPLEFT" }, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.1 Hyper Parameter Optimization" }, { "label": "text", "id": 3, "page_no": 8, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.76498, "t": 185.58582, "r": 480.59277, "b": 254.15886999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.9842326641082764, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 194.38280999999995, "r_x1": 480.59183, "r_y1": 194.38280999999995, "r_x2": 480.59183, "r_y2": 185.58582, "r_x3": 134.765, "r_y3": 185.58582, "coord_origin": "TOPLEFT" }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 206.33783000000005, "r_x1": 480.59183, "r_y1": 206.33783000000005, "r_x2": 480.59183, "r_y2": 197.54083000000003, "r_x3": 134.765, "r_y3": 197.54083000000003, "coord_origin": "TOPLEFT" }, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 218.29285000000004, "r_x1": 480.59177000000005, "r_y1": 218.29285000000004, "r_x2": 480.59177000000005, "r_y2": 209.49585000000002, "r_x3": 134.765, "r_y3": 209.49585000000002, "coord_origin": "TOPLEFT" }, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 230.24785999999995, "r_x1": 480.59277, "r_y1": 230.24785999999995, "r_x2": 480.59277, "r_y2": 221.45087, "r_x3": 134.765, "r_y3": 221.45087, "coord_origin": "TOPLEFT" }, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 242.20288000000005, "r_x1": 440.94159, "r_y1": 242.20288000000005, "r_x2": 440.94159, "r_y2": 233.40588000000002, "r_x3": 134.765, "r_y3": 233.40588000000002, "coord_origin": "TOPLEFT" }, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.86798, "r_y0": 242.20288000000005, "r_x1": 480.58786000000003, "r_y1": 242.20288000000005, "r_x2": 480.58786000000003, "r_y2": 233.40588000000002, "r_x3": 444.86798, "r_y3": 233.40588000000002, "coord_origin": "TOPLEFT" }, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 254.15886999999998, "r_x1": 145.20081, "r_y1": 254.15886999999998, "r_x2": 145.20081, "r_y2": 245.36188000000004, "r_x3": 134.76498, "r_y3": 245.36188000000004, "coord_origin": "TOPLEFT" }, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.14899, "r_y0": 254.15886999999998, "r_x1": 311.21957, "r_y1": 254.15886999999998, "r_x2": 311.21957, "r_y2": 245.36188000000004, "r_x3": 149.14899, "r_y3": 245.36188000000004, "coord_origin": "TOPLEFT" }, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a highly diverse set of tables. Also we report TED scores separately for simple and complex tables (tables with cell spans). Results are presented in Table. 1. It is evident that with OTSL, our model achieves the same TED score and slightly better mAP scores in comparison to HTML. However OTSL yields a 2x speed up in the inference runtime over HTML." }, { "label": "caption", "id": 7, "page_no": 8, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 134.76498, "t": 275.07232999999997, "r": 480.5954, "b": 327.0408, "coord_origin": "TOPLEFT" }, "confidence": 0.9570781588554382, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 282.9986, "r_x1": 160.11836, "r_y1": 282.9986, "r_x2": 160.11836, "r_y2": 275.07232999999997, "r_x3": 134.76498, "r_y3": 275.07232999999997, "coord_origin": "TOPLEFT" }, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.34528, "r_y0": 282.9986, "r_x1": 175.59526, "r_y1": 282.9986, "r_x2": 175.59526, "r_y2": 275.07232999999997, "r_x3": 167.34528, "r_y3": 275.07232999999997, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.13298, "r_y0": 283.2048300000001, "r_x1": 480.59365999999994, "r_y1": 283.2048300000001, "r_x2": 480.59365999999994, "r_y2": 275.13507000000004, "r_x3": 188.13298, "r_y3": 275.13507000000004, "coord_origin": "TOPLEFT" }, "text": "HPO performed in OTSL and HTML representation on the same", "orig": "HPO performed in OTSL and HTML representation on the same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 294.16385, "r_x1": 480.59444999999994, "r_y1": 294.16385, "r_x2": 480.59444999999994, "r_y2": 286.09409, "r_x3": 134.76498, "r_y3": 286.09409, "coord_origin": "TOPLEFT" }, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 305.12283, "r_x1": 480.5954, "r_y1": 305.12283, "r_x2": 480.5954, "r_y2": 297.05307, "r_x3": 134.76498, "r_y3": 297.05307, "coord_origin": "TOPLEFT" }, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 316.08182, "r_x1": 480.59451, "r_y1": 316.08182, "r_x2": 480.59451, "r_y2": 308.01205, "r_x3": 134.76498, "r_y3": 308.01205, "coord_origin": "TOPLEFT" }, "text": "smaller models trained on OTSL perform better, especially in recognizing complex", "orig": "smaller models trained on OTSL perform better, especially in recognizing complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76498, "r_y0": 327.0408, "r_x1": 480.59441999999996, "r_y1": 327.0408, "r_x2": 480.59441999999996, "r_y2": 318.97104, "r_x3": 134.76498, "r_y3": 318.97104, "coord_origin": "TOPLEFT" }, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 1. HPO performed in OTSL and HTML representation on the same transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Effects of reducing the # of layers in encoder and decoder stages of the model show that smaller models trained on OTSL perform better, especially in recognizing complex table structures, and maintain a much higher mAP score than the HTML counterpart." }, { "label": "table", "id": 0, "page_no": 8, "cluster": { "id": 0, "label": "table", "bbox": { "l": 139.66845703125, "t": 337.5747985839844, "r": 475.00372314453125, "b": 469.4721374511719, "coord_origin": "TOPLEFT" }, "confidence": 0.9901032447814941, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8047199999999, "r_x1": 168.04793, "r_y1": 349.8047199999999, "r_x2": 168.04793, "r_y2": 341.73495, "r_x3": 160.37, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.592, "r_y0": 362.75570999999997, "r_x1": 183.82806, "r_y1": 362.75570999999997, "r_x2": 183.82806, "r_y2": 354.68594, "r_x3": 144.592, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.974, "r_y0": 349.8047199999999, "r_x1": 215.65193, "r_y1": 349.8047199999999, "r_x2": 215.65193, "r_y2": 341.73495, "r_x3": 207.974, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19499, "r_y0": 362.75570999999997, "r_x1": 231.43106, "r_y1": 362.75570999999997, "r_x2": 231.43106, "r_y2": 354.68594, "r_x3": 192.19499, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.79799999999997, "r_y0": 355.28372, "r_x1": 278.31766, "r_y1": 355.28372, "r_x2": 278.31766, "r_y2": 347.21396, "r_x3": 239.79799999999997, "r_y3": 347.21396, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67001, "r_y0": 349.8047199999999, "r_x1": 348.26419, "r_y1": 349.8047199999999, "r_x2": 348.26419, "r_y2": 341.73495, "r_x3": 324.67001, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.271, "r_y0": 349.8047199999999, "r_x1": 417.12683, "r_y1": 349.8047199999999, "r_x2": 417.12683, "r_y2": 341.73495, "r_x3": 396.271, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.927, "r_y0": 360.7637, "r_x1": 418.47278, "r_y1": 360.7637, "r_x2": 418.47278, "r_y2": 352.69394000000005, "r_x3": 394.927, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.771, "r_y0": 349.8047199999999, "r_x1": 467.1423, "r_y1": 349.8047199999999, "r_x2": 467.1423, "r_y2": 341.73495, "r_x3": 430.771, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.14801, "r_y0": 360.7637, "r_x1": 470.76056, "r_y1": 360.7637, "r_x2": 470.76056, "r_y2": 352.69394000000005, "r_x3": 427.14801, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.686, "r_y0": 362.75570999999997, "r_x1": 312.33261, "r_y1": 362.75570999999997, "r_x2": 312.33261, "r_y2": 354.68594, "r_x3": 286.686, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.702, "r_y0": 362.75570999999997, "r_x1": 353.71988, "r_y1": 362.75570999999997, "r_x2": 353.71988, "r_y2": 354.68594, "r_x3": 320.702, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.306, "r_y0": 362.75570999999997, "r_x1": 379.03094, "r_y1": 362.75570999999997, "r_x2": 379.03094, "r_y2": 354.68594, "r_x3": 369.306, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 381.58572, "r_x1": 166.51294, "r_y1": 381.58572, "r_x2": 166.51294, "r_y2": 373.51596, "r_x3": 161.90601, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 381.58572, "r_x1": 214.11594, "r_y1": 381.58572, "r_x2": 214.11594, "r_y2": 373.51596, "r_x3": 209.509, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 376.10571, "r_x1": 271.40527, "r_y1": 376.10571, "r_x2": 271.40527, "r_y2": 368.03595, "r_x3": 246.71000999999998, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 376.10571, "r_x1": 310.00375, "r_y1": 376.10571, "r_x2": 310.00375, "r_y2": 368.03595, "r_x3": 289.017, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 376.10571, "r_x1": 347.70377, "r_y1": 376.10571, "r_x2": 347.70377, "r_y2": 368.03595, "r_x3": 326.71701, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 376.10571, "r_x1": 384.66275, "r_y1": 376.10571, "r_x2": 384.66275, "r_y2": 368.03595, "r_x3": 363.67599, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.26999, "r_y0": 375.89948, "r_x1": 416.12723, "r_y1": 375.89948, "r_x2": 416.12723, "r_y2": 367.97317999999996, "r_x3": 397.26999, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 375.89948, "r_x1": 458.38425, "r_y1": 375.89948, "r_x2": 458.38425, "r_y2": 367.97317999999996, "r_x3": 439.52701, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 389.05771, "r_x1": 272.93954, "r_y1": 389.05771, "r_x2": 272.93954, "r_y2": 380.98795, "r_x3": 245.17598999999998, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 389.05771, "r_x1": 310.00375, "r_y1": 389.05771, "r_x2": 310.00375, "r_y2": 380.98795, "r_x3": 289.017, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 389.05771, "r_x1": 347.70377, "r_y1": 389.05771, "r_x2": 347.70377, "r_y2": 380.98795, "r_x3": 326.71701, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 389.05771, "r_x1": 384.66275, "r_y1": 389.05771, "r_x2": 384.66275, "r_y2": 380.98795, "r_x3": 363.67599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 389.05771, "r_x1": 417.19275, "r_y1": 389.05771, "r_x2": 417.19275, "r_y2": 380.98795, "r_x3": 396.20599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 389.05771, "r_x1": 457.14682, "r_y1": 389.05771, "r_x2": 457.14682, "r_y2": 380.98795, "r_x3": 440.767, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 407.88672, "r_x1": 166.51294, "r_y1": 407.88672, "r_x2": 166.51294, "r_y2": 399.81696, "r_x3": 161.90601, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 407.88672, "r_x1": 214.11594, "r_y1": 407.88672, "r_x2": 214.11594, "r_y2": 399.81696, "r_x3": 209.509, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 402.40771, "r_x1": 271.40527, "r_y1": 402.40771, "r_x2": 271.40527, "r_y2": 394.33795, "r_x3": 246.71000999999998, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 402.40771, "r_x1": 310.00375, "r_y1": 402.40771, "r_x2": 310.00375, "r_y2": 394.33795, "r_x3": 289.017, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 402.40771, "r_x1": 347.70377, "r_y1": 402.40771, "r_x2": 347.70377, "r_y2": 394.33795, "r_x3": 326.71701, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 402.40771, "r_x1": 384.66275, "r_y1": 402.40771, "r_x2": 384.66275, "r_y2": 394.33795, "r_x3": 363.67599, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 402.20148, "r_x1": 418.77887, "r_y1": 402.20148, "r_x2": 418.77887, "r_y2": 394.27518, "r_x3": 394.61801, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 402.20148, "r_x1": 458.38425, "r_y1": 402.20148, "r_x2": 458.38425, "r_y2": 394.27518, "r_x3": 439.52701, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 415.3587, "r_x1": 272.93954, "r_y1": 415.3587, "r_x2": 272.93954, "r_y2": 407.28894, "r_x3": 245.17598999999998, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 415.3587, "r_x1": 310.00375, "r_y1": 415.3587, "r_x2": 310.00375, "r_y2": 407.28894, "r_x3": 289.017, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 415.3587, "r_x1": 347.70377, "r_y1": 415.3587, "r_x2": 347.70377, "r_y2": 407.28894, "r_x3": 326.71701, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 415.15247, "r_x1": 386.24887, "r_y1": 415.15247, "r_x2": 386.24887, "r_y2": 407.22617, "r_x3": 362.08801, "r_y3": 407.22617, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 415.3587, "r_x1": 417.19275, "r_y1": 415.3587, "r_x2": 417.19275, "r_y2": 407.28894, "r_x3": 396.20599, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 415.3587, "r_x1": 457.14682, "r_y1": 415.3587, "r_x2": 457.14682, "r_y2": 407.28894, "r_x3": 440.767, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 434.1877099999999, "r_x1": 166.51294, "r_y1": 434.1877099999999, "r_x2": 166.51294, "r_y2": 426.11795, "r_x3": 161.90601, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 434.1877099999999, "r_x1": 214.11594, "r_y1": 434.1877099999999, "r_x2": 214.11594, "r_y2": 426.11795, "r_x3": 209.509, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 428.70871, "r_x1": 271.40527, "r_y1": 428.70871, "r_x2": 271.40527, "r_y2": 420.63895, "r_x3": 246.71000999999998, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 428.70871, "r_x1": 310.00375, "r_y1": 428.70871, "r_x2": 310.00375, "r_y2": 420.63895, "r_x3": 289.017, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 428.70871, "r_x1": 347.70377, "r_y1": 428.70871, "r_x2": 347.70377, "r_y2": 420.63895, "r_x3": 326.71701, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 428.70871, "r_x1": 384.66275, "r_y1": 428.70871, "r_x2": 384.66275, "r_y2": 420.63895, "r_x3": 363.67599, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 428.50247, "r_x1": 418.77887, "r_y1": 428.50247, "r_x2": 418.77887, "r_y2": 420.57617, "r_x3": 394.61801, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 428.50247, "r_x1": 458.38425, "r_y1": 428.50247, "r_x2": 458.38425, "r_y2": 420.57617, "r_x3": 439.52701, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 441.6597, "r_x1": 272.93954, "r_y1": 441.6597, "r_x2": 272.93954, "r_y2": 433.58994, "r_x3": 245.17598999999998, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 441.6597, "r_x1": 310.00375, "r_y1": 441.6597, "r_x2": 310.00375, "r_y2": 433.58994, "r_x3": 289.017, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 441.6597, "r_x1": 347.70377, "r_y1": 441.6597, "r_x2": 347.70377, "r_y2": 433.58994, "r_x3": 326.71701, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 441.45346, "r_x1": 386.24887, "r_y1": 441.45346, "r_x2": 386.24887, "r_y2": 433.5271599999999, "r_x3": 362.08801, "r_y3": 433.5271599999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 441.6597, "r_x1": 417.19275, "r_y1": 441.6597, "r_x2": 417.19275, "r_y2": 433.58994, "r_x3": 396.20599, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 441.6597, "r_x1": 457.14682, "r_y1": 441.6597, "r_x2": 457.14682, "r_y2": 433.58994, "r_x3": 440.767, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 460.48972, "r_x1": 166.51294, "r_y1": 460.48972, "r_x2": 166.51294, "r_y2": 452.41995, "r_x3": 161.90601, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 460.48972, "r_x1": 214.11594, "r_y1": 460.48972, "r_x2": 214.11594, "r_y2": 452.41995, "r_x3": 209.509, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 455.0097, "r_x1": 271.40527, "r_y1": 455.0097, "r_x2": 271.40527, "r_y2": 446.9399399999999, "r_x3": 246.71000999999998, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 455.0097, "r_x1": 310.00375, "r_y1": 455.0097, "r_x2": 310.00375, "r_y2": 446.9399399999999, "r_x3": 289.017, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.021, "r_y0": 455.0097, "r_x1": 345.40082, "r_y1": 455.0097, "r_x2": 345.40082, "r_y2": 446.9399399999999, "r_x3": 329.021, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 454.80347, "r_x1": 386.24887, "r_y1": 454.80347, "r_x2": 386.24887, "r_y2": 446.87717, "r_x3": 362.08801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 454.80347, "r_x1": 418.77887, "r_y1": 454.80347, "r_x2": 418.77887, "r_y2": 446.87717, "r_x3": 394.61801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 454.80347, "r_x1": 458.38425, "r_y1": 454.80347, "r_x2": 458.38425, "r_y2": 446.87717, "r_x3": 439.52701, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 467.9617, "r_x1": 272.93954, "r_y1": 467.9617, "r_x2": 272.93954, "r_y2": 459.8919399999999, "r_x3": 245.17598999999998, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 467.9617, "r_x1": 310.00375, "r_y1": 467.9617, "r_x2": 310.00375, "r_y2": 459.8919399999999, "r_x3": 289.017, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 467.9617, "r_x1": 347.70377, "r_y1": 467.9617, "r_x2": 347.70377, "r_y2": 459.8919399999999, "r_x3": 326.71701, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 467.9617, "r_x1": 384.66275, "r_y1": 467.9617, "r_x2": 384.66275, "r_y2": 459.8919399999999, "r_x3": 363.67599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 467.9617, "r_x1": 417.19275, "r_y1": 467.9617, "r_x2": 417.19275, "r_y2": 459.8919399999999, "r_x3": 396.20599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65302, "r_y0": 467.9617, "r_x1": 451.25995, "r_y1": 467.9617, "r_x2": 451.25995, "r_y2": 459.8919399999999, "r_x3": 446.65302, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 160.37, "t": 341.73495, "r": 168.04793, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8047199999999, "r_x1": 168.04793, "r_y1": 349.8047199999999, "r_x2": 168.04793, "r_y2": 341.73495, "r_x3": 160.37, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 144.592, "t": 354.68594, "r": 183.82806, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.592, "r_y0": 362.75570999999997, "r_x1": 183.82806, "r_y1": 362.75570999999997, "r_x2": 183.82806, "r_y2": 354.68594, "r_x3": 144.592, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 207.974, "t": 341.73495, "r": 215.65193, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.974, "r_y0": 349.8047199999999, "r_x1": 215.65193, "r_y1": 349.8047199999999, "r_x2": 215.65193, "r_y2": 341.73495, "r_x3": 207.974, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 192.19499, "t": 354.68594, "r": 231.43106, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19499, "r_y0": 362.75570999999997, "r_x1": 231.43106, "r_y1": 362.75570999999997, "r_x2": 231.43106, "r_y2": 354.68594, "r_x3": 192.19499, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 239.79799999999997, "t": 347.21396, "r": 278.31766, "b": 355.28372, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.79799999999997, "r_y0": 355.28372, "r_x1": 278.31766, "r_y1": 355.28372, "r_x2": 278.31766, "r_y2": 347.21396, "r_x3": 239.79799999999997, "r_y3": 347.21396, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 324.67001, "t": 341.73495, "r": 348.26419, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67001, "r_y0": 349.8047199999999, "r_x1": 348.26419, "r_y1": 349.8047199999999, "r_x2": 348.26419, "r_y2": 341.73495, "r_x3": 324.67001, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 396.271, "t": 341.73495, "r": 417.12683, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.271, "r_y0": 349.8047199999999, "r_x1": 417.12683, "r_y1": 349.8047199999999, "r_x2": 417.12683, "r_y2": 341.73495, "r_x3": 396.271, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 394.927, "t": 352.69394000000005, "r": 418.47278, "b": 360.7637, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.927, "r_y0": 360.7637, "r_x1": 418.47278, "r_y1": 360.7637, "r_x2": 418.47278, "r_y2": 352.69394000000005, "r_x3": 394.927, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 430.771, "t": 341.73495, "r": 467.1423, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.771, "r_y0": 349.8047199999999, "r_x1": 467.1423, "r_y1": 349.8047199999999, "r_x2": 467.1423, "r_y2": 341.73495, "r_x3": 430.771, "r_y3": 341.73495, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 427.14801, "t": 352.69394000000005, "r": 470.76056, "b": 360.7637, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.14801, "r_y0": 360.7637, "r_x1": 470.76056, "r_y1": 360.7637, "r_x2": 470.76056, "r_y2": 352.69394000000005, "r_x3": 427.14801, "r_y3": 352.69394000000005, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 286.686, "t": 354.68594, "r": 312.33261, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.686, "r_y0": 362.75570999999997, "r_x1": 312.33261, "r_y1": 362.75570999999997, "r_x2": 312.33261, "r_y2": 354.68594, "r_x3": 286.686, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 320.702, "t": 354.68594, "r": 353.71988, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.702, "r_y0": 362.75570999999997, "r_x1": 353.71988, "r_y1": 362.75570999999997, "r_x2": 353.71988, "r_y2": 354.68594, "r_x3": 320.702, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 369.306, "t": 354.68594, "r": 379.03094, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.306, "r_y0": 362.75570999999997, "r_x1": 379.03094, "r_y1": 362.75570999999997, "r_x2": 379.03094, "r_y2": 354.68594, "r_x3": 369.306, "r_y3": 354.68594, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 161.90601, "t": 373.51596, "r": 166.51294, "b": 381.58572, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 381.58572, "r_x1": 166.51294, "r_y1": 381.58572, "r_x2": 166.51294, "r_y2": 373.51596, "r_x3": 161.90601, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 209.509, "t": 373.51596, "r": 214.11594, "b": 381.58572, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 381.58572, "r_x1": 214.11594, "r_y1": 381.58572, "r_x2": 214.11594, "r_y2": 373.51596, "r_x3": 209.509, "r_y3": 373.51596, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 246.71000999999998, "t": 368.03595, "r": 271.40527, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 376.10571, "r_x1": 271.40527, "r_y1": 376.10571, "r_x2": 271.40527, "r_y2": 368.03595, "r_x3": 246.71000999999998, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 289.017, "t": 368.03595, "r": 310.00375, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 376.10571, "r_x1": 310.00375, "r_y1": 376.10571, "r_x2": 310.00375, "r_y2": 368.03595, "r_x3": 289.017, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 326.71701, "t": 368.03595, "r": 347.70377, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 376.10571, "r_x1": 347.70377, "r_y1": 376.10571, "r_x2": 347.70377, "r_y2": 368.03595, "r_x3": 326.71701, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 363.67599, "t": 368.03595, "r": 384.66275, "b": 376.10571, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 376.10571, "r_x1": 384.66275, "r_y1": 376.10571, "r_x2": 384.66275, "r_y2": 368.03595, "r_x3": 363.67599, "r_y3": 368.03595, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 397.26999, "t": 367.97317999999996, "r": 416.12723, "b": 375.89948, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.26999, "r_y0": 375.89948, "r_x1": 416.12723, "r_y1": 375.89948, "r_x2": 416.12723, "r_y2": 367.97317999999996, "r_x3": 397.26999, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 439.52701, "t": 367.97317999999996, "r": 458.38425, "b": 375.89948, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 375.89948, "r_x1": 458.38425, "r_y1": 375.89948, "r_x2": 458.38425, "r_y2": 367.97317999999996, "r_x3": 439.52701, "r_y3": 367.97317999999996, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 245.17598999999998, "t": 380.98795, "r": 272.93954, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 389.05771, "r_x1": 272.93954, "r_y1": 389.05771, "r_x2": 272.93954, "r_y2": 380.98795, "r_x3": 245.17598999999998, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 289.017, "t": 380.98795, "r": 310.00375, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 389.05771, "r_x1": 310.00375, "r_y1": 389.05771, "r_x2": 310.00375, "r_y2": 380.98795, "r_x3": 289.017, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 326.71701, "t": 380.98795, "r": 347.70377, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 389.05771, "r_x1": 347.70377, "r_y1": 389.05771, "r_x2": 347.70377, "r_y2": 380.98795, "r_x3": 326.71701, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 363.67599, "t": 380.98795, "r": 384.66275, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 389.05771, "r_x1": 384.66275, "r_y1": 389.05771, "r_x2": 384.66275, "r_y2": 380.98795, "r_x3": 363.67599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.20599, "t": 380.98795, "r": 417.19275, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 389.05771, "r_x1": 417.19275, "r_y1": 389.05771, "r_x2": 417.19275, "r_y2": 380.98795, "r_x3": 396.20599, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 440.767, "t": 380.98795, "r": 457.14682, "b": 389.05771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 389.05771, "r_x1": 457.14682, "r_y1": 389.05771, "r_x2": 457.14682, "r_y2": 380.98795, "r_x3": 440.767, "r_y3": 380.98795, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 161.90601, "t": 399.81696, "r": 166.51294, "b": 407.88672, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 407.88672, "r_x1": 166.51294, "r_y1": 407.88672, "r_x2": 166.51294, "r_y2": 399.81696, "r_x3": 161.90601, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 209.509, "t": 399.81696, "r": 214.11594, "b": 407.88672, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 407.88672, "r_x1": 214.11594, "r_y1": 407.88672, "r_x2": 214.11594, "r_y2": 399.81696, "r_x3": 209.509, "r_y3": 399.81696, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 246.71000999999998, "t": 394.33795, "r": 271.40527, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 402.40771, "r_x1": 271.40527, "r_y1": 402.40771, "r_x2": 271.40527, "r_y2": 394.33795, "r_x3": 246.71000999999998, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 289.017, "t": 394.33795, "r": 310.00375, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 402.40771, "r_x1": 310.00375, "r_y1": 402.40771, "r_x2": 310.00375, "r_y2": 394.33795, "r_x3": 289.017, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 326.71701, "t": 394.33795, "r": 347.70377, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 402.40771, "r_x1": 347.70377, "r_y1": 402.40771, "r_x2": 347.70377, "r_y2": 394.33795, "r_x3": 326.71701, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 363.67599, "t": 394.33795, "r": 384.66275, "b": 402.40771, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 402.40771, "r_x1": 384.66275, "r_y1": 402.40771, "r_x2": 384.66275, "r_y2": 394.33795, "r_x3": 363.67599, "r_y3": 394.33795, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 394.61801, "t": 394.27518, "r": 418.77887, "b": 402.20148, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 402.20148, "r_x1": 418.77887, "r_y1": 402.20148, "r_x2": 418.77887, "r_y2": 394.27518, "r_x3": 394.61801, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 439.52701, "t": 394.27518, "r": 458.38425, "b": 402.20148, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 402.20148, "r_x1": 458.38425, "r_y1": 402.20148, "r_x2": 458.38425, "r_y2": 394.27518, "r_x3": 439.52701, "r_y3": 394.27518, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 245.17598999999998, "t": 407.28894, "r": 272.93954, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 415.3587, "r_x1": 272.93954, "r_y1": 415.3587, "r_x2": 272.93954, "r_y2": 407.28894, "r_x3": 245.17598999999998, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 289.017, "t": 407.28894, "r": 310.00375, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 415.3587, "r_x1": 310.00375, "r_y1": 415.3587, "r_x2": 310.00375, "r_y2": 407.28894, "r_x3": 289.017, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 326.71701, "t": 407.28894, "r": 347.70377, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 415.3587, "r_x1": 347.70377, "r_y1": 415.3587, "r_x2": 347.70377, "r_y2": 407.28894, "r_x3": 326.71701, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 362.08801, "t": 407.22617, "r": 386.24887, "b": 415.15247, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 415.15247, "r_x1": 386.24887, "r_y1": 415.15247, "r_x2": 386.24887, "r_y2": 407.22617, "r_x3": 362.08801, "r_y3": 407.22617, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 396.20599, "t": 407.28894, "r": 417.19275, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 415.3587, "r_x1": 417.19275, "r_y1": 415.3587, "r_x2": 417.19275, "r_y2": 407.28894, "r_x3": 396.20599, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 440.767, "t": 407.28894, "r": 457.14682, "b": 415.3587, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 415.3587, "r_x1": 457.14682, "r_y1": 415.3587, "r_x2": 457.14682, "r_y2": 407.28894, "r_x3": 440.767, "r_y3": 407.28894, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 161.90601, "t": 426.11795, "r": 166.51294, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 434.1877099999999, "r_x1": 166.51294, "r_y1": 434.1877099999999, "r_x2": 166.51294, "r_y2": 426.11795, "r_x3": 161.90601, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 209.509, "t": 426.11795, "r": 214.11594, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 434.1877099999999, "r_x1": 214.11594, "r_y1": 434.1877099999999, "r_x2": 214.11594, "r_y2": 426.11795, "r_x3": 209.509, "r_y3": 426.11795, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 246.71000999999998, "t": 420.63895, "r": 271.40527, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 428.70871, "r_x1": 271.40527, "r_y1": 428.70871, "r_x2": 271.40527, "r_y2": 420.63895, "r_x3": 246.71000999999998, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 289.017, "t": 420.63895, "r": 310.00375, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 428.70871, "r_x1": 310.00375, "r_y1": 428.70871, "r_x2": 310.00375, "r_y2": 420.63895, "r_x3": 289.017, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.71701, "t": 420.63895, "r": 347.70377, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 428.70871, "r_x1": 347.70377, "r_y1": 428.70871, "r_x2": 347.70377, "r_y2": 420.63895, "r_x3": 326.71701, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 363.67599, "t": 420.63895, "r": 384.66275, "b": 428.70871, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 428.70871, "r_x1": 384.66275, "r_y1": 428.70871, "r_x2": 384.66275, "r_y2": 420.63895, "r_x3": 363.67599, "r_y3": 420.63895, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 394.61801, "t": 420.57617, "r": 418.77887, "b": 428.50247, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 428.50247, "r_x1": 418.77887, "r_y1": 428.50247, "r_x2": 418.77887, "r_y2": 420.57617, "r_x3": 394.61801, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 439.52701, "t": 420.57617, "r": 458.38425, "b": 428.50247, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 428.50247, "r_x1": 458.38425, "r_y1": 428.50247, "r_x2": 458.38425, "r_y2": 420.57617, "r_x3": 439.52701, "r_y3": 420.57617, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 245.17598999999998, "t": 433.58994, "r": 272.93954, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 441.6597, "r_x1": 272.93954, "r_y1": 441.6597, "r_x2": 272.93954, "r_y2": 433.58994, "r_x3": 245.17598999999998, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 289.017, "t": 433.58994, "r": 310.00375, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 441.6597, "r_x1": 310.00375, "r_y1": 441.6597, "r_x2": 310.00375, "r_y2": 433.58994, "r_x3": 289.017, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 326.71701, "t": 433.58994, "r": 347.70377, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 441.6597, "r_x1": 347.70377, "r_y1": 441.6597, "r_x2": 347.70377, "r_y2": 433.58994, "r_x3": 326.71701, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 362.08801, "t": 433.5271599999999, "r": 386.24887, "b": 441.45346, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 441.45346, "r_x1": 386.24887, "r_y1": 441.45346, "r_x2": 386.24887, "r_y2": 433.5271599999999, "r_x3": 362.08801, "r_y3": 433.5271599999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 396.20599, "t": 433.58994, "r": 417.19275, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 441.6597, "r_x1": 417.19275, "r_y1": 441.6597, "r_x2": 417.19275, "r_y2": 433.58994, "r_x3": 396.20599, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 440.767, "t": 433.58994, "r": 457.14682, "b": 441.6597, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.767, "r_y0": 441.6597, "r_x1": 457.14682, "r_y1": 441.6597, "r_x2": 457.14682, "r_y2": 433.58994, "r_x3": 440.767, "r_y3": 433.58994, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 161.90601, "t": 452.41995, "r": 166.51294, "b": 460.48972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.90601, "r_y0": 460.48972, "r_x1": 166.51294, "r_y1": 460.48972, "r_x2": 166.51294, "r_y2": 452.41995, "r_x3": 161.90601, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 209.509, "t": 452.41995, "r": 214.11594, "b": 460.48972, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.509, "r_y0": 460.48972, "r_x1": 214.11594, "r_y1": 460.48972, "r_x2": 214.11594, "r_y2": 452.41995, "r_x3": 209.509, "r_y3": 452.41995, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 246.71000999999998, "t": 446.9399399999999, "r": 271.40527, "b": 455.0097, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71000999999998, "r_y0": 455.0097, "r_x1": 271.40527, "r_y1": 455.0097, "r_x2": 271.40527, "r_y2": 446.9399399999999, "r_x3": 246.71000999999998, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 289.017, "t": 446.9399399999999, "r": 310.00375, "b": 455.0097, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 455.0097, "r_x1": 310.00375, "r_y1": 455.0097, "r_x2": 310.00375, "r_y2": 446.9399399999999, "r_x3": 289.017, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 329.021, "t": 446.9399399999999, "r": 345.40082, "b": 455.0097, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.021, "r_y0": 455.0097, "r_x1": 345.40082, "r_y1": 455.0097, "r_x2": 345.40082, "r_y2": 446.9399399999999, "r_x3": 329.021, "r_y3": 446.9399399999999, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 362.08801, "t": 446.87717, "r": 386.24887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.08801, "r_y0": 454.80347, "r_x1": 386.24887, "r_y1": 454.80347, "r_x2": 386.24887, "r_y2": 446.87717, "r_x3": 362.08801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.61801, "t": 446.87717, "r": 418.77887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.61801, "r_y0": 454.80347, "r_x1": 418.77887, "r_y1": 454.80347, "r_x2": 418.77887, "r_y2": 446.87717, "r_x3": 394.61801, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 439.52701, "t": 446.87717, "r": 458.38425, "b": 454.80347, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.52701, "r_y0": 454.80347, "r_x1": 458.38425, "r_y1": 454.80347, "r_x2": 458.38425, "r_y2": 446.87717, "r_x3": 439.52701, "r_y3": 446.87717, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 245.17598999999998, "t": 459.8919399999999, "r": 272.93954, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.17598999999998, "r_y0": 467.9617, "r_x1": 272.93954, "r_y1": 467.9617, "r_x2": 272.93954, "r_y2": 459.8919399999999, "r_x3": 245.17598999999998, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.017, "t": 459.8919399999999, "r": 310.00375, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.017, "r_y0": 467.9617, "r_x1": 310.00375, "r_y1": 467.9617, "r_x2": 310.00375, "r_y2": 459.8919399999999, "r_x3": 289.017, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 326.71701, "t": 459.8919399999999, "r": 347.70377, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.71701, "r_y0": 467.9617, "r_x1": 347.70377, "r_y1": 467.9617, "r_x2": 347.70377, "r_y2": 459.8919399999999, "r_x3": 326.71701, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 363.67599, "t": 459.8919399999999, "r": 384.66275, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.67599, "r_y0": 467.9617, "r_x1": 384.66275, "r_y1": 467.9617, "r_x2": 384.66275, "r_y2": 459.8919399999999, "r_x3": 363.67599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 396.20599, "t": 459.8919399999999, "r": 417.19275, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.20599, "r_y0": 467.9617, "r_x1": 417.19275, "r_y1": 467.9617, "r_x2": 417.19275, "r_y2": 459.8919399999999, "r_x3": 396.20599, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 446.65302, "t": 459.8919399999999, "r": 451.25995, "b": 467.9617, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65302, "r_y0": 467.9617, "r_x1": 451.25995, "r_y1": 467.9617, "r_x2": 451.25995, "r_y2": 459.8919399999999, "r_x3": 446.65302, "r_y3": 459.8919399999999, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 6, "num_cols": 8, "table_cells": [ { "bbox": { "l": 160.37, "t": 341.73495, "r": 168.04793, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "# enc-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 207.974, "t": 341.73495, "r": 215.65193, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "# dec-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 239.79799999999997, "t": 347.21396, "r": 278.31766, "b": 355.28372, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 324.67001, "t": 341.73495, "r": 348.26419, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 6, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 396.271, "t": 341.73495, "r": 417.12683, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 394.927, "t": 352.69394000000005, "r": 418.47278, "b": 360.7637, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 430.771, "t": 341.73495, "r": 467.1423, "b": 349.8047199999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "Inference", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.14801, "t": 352.69394000000005, "r": 470.76056, "b": 360.7637, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 286.686, "t": 354.68594, "r": 312.33261, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 320.702, "t": 354.68594, "r": 353.71988, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 369.306, "t": 354.68594, "r": 379.03094, "b": 362.75570999999997, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 161.90601, "t": 373.51596, "r": 166.51294, "b": 381.58572, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.509, "t": 373.51596, "r": 214.11594, "b": 381.58572, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71000999999998, "t": 368.03595, "r": 271.40527, "b": 376.10571, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.017, "t": 368.03595, "r": 310.00375, "b": 376.10571, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.71701, "t": 368.03595, "r": 347.70377, "b": 376.10571, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.67599, "t": 368.03595, "r": 384.66275, "b": 376.10571, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 397.26999, "t": 367.97317999999996, "r": 416.12723, "b": 375.89948, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.52701, "t": 367.97317999999996, "r": 458.38425, "b": 375.89948, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.90601, "t": 399.81696, "r": 166.51294, "b": 407.88672, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.509, "t": 399.81696, "r": 214.11594, "b": 407.88672, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71000999999998, "t": 394.33795, "r": 271.40527, "b": 402.40771, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.017, "t": 394.33795, "r": 310.00375, "b": 402.40771, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.938 0.952", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.71701, "t": 394.33795, "r": 347.70377, "b": 402.40771, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.904 0.909", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.67599, "t": 394.33795, "r": 384.66275, "b": 402.40771, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.927 0.938", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.61801, "t": 394.27518, "r": 418.77887, "b": 402.20148, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.853 0.843", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.52701, "t": 394.27518, "r": 458.38425, "b": 402.20148, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.97 3.77", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.90601, "t": 426.11795, "r": 166.51294, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.509, "t": 426.11795, "r": 214.11594, "b": 434.1877099999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71000999999998, "t": 420.63895, "r": 271.40527, "b": 428.70871, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.017, "t": 420.63895, "r": 310.00375, "b": 428.70871, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.923 0.945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.71701, "t": 420.63895, "r": 347.70377, "b": 428.70871, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.897 0.901", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.67599, "t": 420.63895, "r": 384.66275, "b": 428.70871, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.915 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.61801, "t": 420.57617, "r": 418.77887, "b": 428.50247, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.859 0.834", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.52701, "t": 420.57617, "r": 458.38425, "b": 428.50247, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.91 3.81", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.90601, "t": 452.41995, "r": 166.51294, "b": 460.48972, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.509, "t": 452.41995, "r": 214.11594, "b": 460.48972, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71000999999998, "t": 446.9399399999999, "r": 271.40527, "b": 455.0097, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.017, "t": 446.9399399999999, "r": 310.00375, "b": 455.0097, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.952 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 329.021, "t": 446.9399399999999, "r": 345.40082, "b": 455.0097, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.92 0.903", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 362.08801, "t": 446.87717, "r": 386.24887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.942 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.61801, "t": 446.87717, "r": 418.77887, "b": 454.80347, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.857 0.824", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.52701, "t": 446.87717, "r": 458.38425, "b": 454.80347, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.22 2", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "section_header", "id": 5, "page_no": 8, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.765, "t": 508.15179, "r": 264.40332, "b": 516.95874, "coord_origin": "TOPLEFT" }, "confidence": 0.9592539668083191, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 516.95874, "r_x1": 149.40205, "r_y1": 516.95874, "r_x2": 149.40205, "r_y2": 508.15179, "r_x3": 134.765, "r_y3": 508.15179, "coord_origin": "TOPLEFT" }, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 516.95874, "r_x1": 264.40332, "r_y1": 516.95874, "r_x2": 264.40332, "r_y2": 508.15179, "r_x3": 160.85904, "r_y3": 508.15179, "coord_origin": "TOPLEFT" }, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.2 Quantitative Results" }, { "label": "text", "id": 1, "page_no": 8, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 524.55078, "r": 480.5957599999999, "b": 617.03474, "coord_origin": "TOPLEFT" }, "confidence": 0.9854757189750671, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 533.34775, "r_x1": 480.59075999999993, "r_y1": 533.34775, "r_x2": 480.59075999999993, "r_y2": 524.55078, "r_x3": 134.765, "r_y3": 524.55078, "coord_origin": "TOPLEFT" }, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 545.3037400000001, "r_x1": 480.58675999999997, "r_y1": 545.3037400000001, "r_x2": 480.58675999999997, "r_y2": 536.50677, "r_x3": 134.765, "r_y3": 536.50677, "coord_origin": "TOPLEFT" }, "text": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 557.25874, "r_x1": 480.59572999999995, "r_y1": 557.25874, "r_x2": 480.59572999999995, "r_y2": 548.4617800000001, "r_x3": 134.765, "r_y3": 548.4617800000001, "coord_origin": "TOPLEFT" }, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 569.21375, "r_x1": 480.59177000000005, "r_y1": 569.21375, "r_x2": 480.59177000000005, "r_y2": 560.41678, "r_x3": 134.765, "r_y3": 560.41678, "coord_origin": "TOPLEFT" }, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 581.16875, "r_x1": 480.59069999999997, "r_y1": 581.16875, "r_x2": 480.59069999999997, "r_y2": 572.37178, "r_x3": 134.765, "r_y3": 572.37178, "coord_origin": "TOPLEFT" }, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 593.12375, "r_x1": 480.5957599999999, "r_y1": 593.12375, "r_x2": 480.5957599999999, "r_y2": 584.32678, "r_x3": 134.765, "r_y3": 584.32678, "coord_origin": "TOPLEFT" }, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 605.07974, "r_x1": 480.58774, "r_y1": 605.07974, "r_x2": 480.58774, "r_y2": 596.28278, "r_x3": 134.765, "r_y3": 596.28278, "coord_origin": "TOPLEFT" }, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 617.03474, "r_x1": 206.78664, "r_y1": 617.03474, "r_x2": 206.78664, "r_y2": 608.2377799999999, "r_x3": 134.765, "r_y3": 608.2377799999999, "coord_origin": "TOPLEFT" }, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We picked the model parameter configuration that produced the best prediction quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently trained and evaluated it on three publicly available data sets: PubTabNet (395k samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples). Performance results are presented in Table. 2. It is clearly evident that the model trained on OTSL outperforms HTML across the board, keeping high TEDs and mAP scores even on difficult financial tables (FinTabNet) that contain sparse and large tables." }, { "label": "text", "id": 2, "page_no": 8, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.765, "t": 620.19278, "r": 480.5957599999999, "b": 664.8547599999999, "coord_origin": "TOPLEFT" }, "confidence": 0.9851234555244446, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 628.98975, "r_x1": 480.59271, "r_y1": 628.98975, "r_x2": 480.59271, "r_y2": 620.19278, "r_x3": 149.709, "r_y3": 620.19278, "coord_origin": "TOPLEFT" }, "text": "Additionally, the results show that OTSL has an advantage over HTML", "orig": "Additionally, the results show that OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 640.94475, "r_x1": 480.5957599999999, "r_y1": 640.94475, "r_x2": 480.5957599999999, "r_y2": 632.14778, "r_x3": 134.765, "r_y3": 632.14778, "coord_origin": "TOPLEFT" }, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 652.89975, "r_x1": 480.59283000000005, "r_y1": 652.89975, "r_x2": 480.59283000000005, "r_y2": 644.1027799999999, "r_x3": 134.765, "r_y3": 644.1027799999999, "coord_origin": "TOPLEFT" }, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 664.8547599999999, "r_x1": 405.79651, "r_y1": 664.8547599999999, "r_x2": 405.79651, "r_y2": 656.0577900000001, "r_x3": 134.765, "r_y3": 656.0577900000001, "coord_origin": "TOPLEFT" }, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Additionally, the results show that OTSL has an advantage over HTML when applied on a bigger data set like PubTables-1M and achieves significantly improved scores. Finally, OTSL achieves faster inference due to fewer decoding steps which is a result of the reduced sequence representation." } ], "headers": [ { "label": "page_header", "id": 8, "page_no": 8, "cluster": { "id": 8, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9373378753662109, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 9, "page_no": 8, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 475.98431, "t": 93.77099999999996, "r": 480.59125000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8857625722885132, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98431, "r_y0": 101.84069999999997, "r_x1": 480.59125000000006, "r_y1": 101.84069999999997, "r_x2": 480.59125000000006, "r_y2": 93.77099999999996, "r_x3": 475.98431, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9" } ] } }, { "page_no": 9, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 143.97887, "r_y1": 101.84069999999997, "r_x2": 143.97887, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82053, "r_y0": 101.84069999999997, "r_x1": 178.08249, "r_y1": 101.84069999999997, "r_x2": 178.08249, "r_y2": 93.77099999999996, "r_x3": 167.82053, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37929, "r_y0": 101.84069999999997, "r_x1": 231.72049000000004, "r_y1": 101.84069999999997, "r_x2": 231.72049000000004, "r_y2": 93.77099999999996, "r_x3": 182.37929, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 123.76251000000002, "r_x1": 173.09366, "r_y1": 123.76251000000002, "r_x2": 173.09366, "r_y2": 115.83618000000001, "r_x3": 134.765, "r_y3": 115.83618000000001, "coord_origin": "TOPLEFT" }, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.30299, "r_y0": 123.96868999999992, "r_x1": 480.59151999999995, "r_y1": 123.96868999999992, "r_x2": 480.59151999999995, "r_y2": 115.89899000000003, "r_x3": 181.30299, "r_y3": 115.89899000000003, "coord_origin": "TOPLEFT" }, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 134.92767000000003, "r_x1": 480.59357000000006, "r_y1": 134.92767000000003, "r_x2": 480.59357000000006, "r_y2": 126.85797000000014, "r_x3": 134.765, "r_y3": 126.85797000000014, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 145.88666, "r_x1": 305.95691, "r_y1": 145.88666, "r_x2": 305.95691, "r_y2": 137.81696, "r_x3": 134.765, "r_y3": 137.81696, "coord_origin": "TOPLEFT" }, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.782, "r_y0": 174.62865999999997, "r_x1": 194.99779, "r_y1": 174.62865999999997, "r_x2": 194.99779, "r_y2": 166.55895999999996, "r_x3": 160.782, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52499000000003, "r_y0": 174.6037, "r_x1": 254.04465, "r_y1": 174.6037, "r_x2": 254.04465, "r_y2": 166.534, "r_x3": 215.52499000000003, "r_y3": 166.534, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.397, "r_y0": 169.14868, "r_x1": 323.99118, "r_y1": 169.14868, "r_x2": 323.99118, "r_y2": 161.07898, "r_x3": 300.397, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.345, "r_y0": 174.62865999999997, "r_x1": 414.74661, "r_y1": 174.62865999999997, "r_x2": 414.74661, "r_y2": 166.55895999999996, "r_x3": 370.345, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.737, "r_y0": 169.14868, "r_x1": 463.10830999999996, "r_y1": 169.14868, "r_x2": 463.10830999999996, "r_y2": 161.07898, "r_x3": 426.737, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11401, "r_y0": 180.10766999999998, "r_x1": 466.72656, "r_y1": 180.10766999999998, "r_x2": 466.72656, "r_y2": 172.03796, "r_x3": 423.11401, "r_y3": 172.03796, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41299, "r_y0": 182.10071000000005, "r_x1": 288.0596, "r_y1": 182.10071000000005, "r_x2": 288.0596, "r_y2": 174.03101000000004, "r_x3": 262.41299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.42899, "r_y0": 182.10071000000005, "r_x1": 329.44687, "r_y1": 182.10071000000005, "r_x2": 329.44687, "r_y2": 174.03101000000004, "r_x3": 296.42899, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03299, "r_y0": 182.10071000000005, "r_x1": 354.75793, "r_y1": 182.10071000000005, "r_x2": 354.75793, "r_y2": 174.03101000000004, "r_x3": 345.03299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.53799, "r_y0": 200.92969000000005, "r_x1": 201.24129, "r_y1": 200.92969000000005, "r_x2": 201.24129, "r_y2": 192.85999000000004, "r_x3": 154.53799, "r_y3": 192.85999000000004, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 195.45068000000003, "r_x1": 247.13226000000003, "r_y1": 195.45068000000003, "r_x2": 247.13226000000003, "r_y2": 187.38098000000002, "r_x3": 222.43700000000004, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 195.45068000000003, "r_x1": 285.73074, "r_y1": 195.45068000000003, "r_x2": 285.73074, "r_y2": 187.38098000000002, "r_x3": 264.74399, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 195.45068000000003, "r_x1": 323.43076, "r_y1": 195.45068000000003, "r_x2": 323.43076, "r_y2": 187.38098000000002, "r_x3": 302.444, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 195.45068000000003, "r_x1": 360.38977, "r_y1": 195.45068000000003, "r_x2": 360.38977, "r_y2": 187.38098000000002, "r_x3": 339.40302, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.116, "r_y0": 195.24451, "r_x1": 401.97324, "r_y1": 195.24451, "r_x2": 401.97324, "r_y2": 187.31817999999998, "r_x3": 383.116, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 195.24451, "r_x1": 454.35025, "r_y1": 195.24451, "r_x2": 454.35025, "r_y2": 187.31817999999998, "r_x3": 435.49300999999997, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 208.40166999999997, "r_x1": 248.66655999999998, "r_y1": 208.40166999999997, "r_x2": 248.66655999999998, "r_y2": 200.33196999999996, "r_x3": 220.903, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 208.40166999999997, "r_x1": 285.73074, "r_y1": 208.40166999999997, "r_x2": 285.73074, "r_y2": 200.33196999999996, "r_x3": 264.74399, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 208.40166999999997, "r_x1": 323.43076, "r_y1": 208.40166999999997, "r_x2": 323.43076, "r_y2": 200.33196999999996, "r_x3": 302.444, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 208.40166999999997, "r_x1": 360.38977, "r_y1": 208.40166999999997, "r_x2": 360.38977, "r_y2": 200.33196999999996, "r_x3": 339.40302, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 208.40166999999997, "r_x1": 403.03876, "r_y1": 208.40166999999997, "r_x2": 403.03876, "r_y2": 200.33196999999996, "r_x3": 382.052, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 208.40166999999997, "r_x1": 453.11182, "r_y1": 208.40166999999997, "r_x2": 453.11182, "r_y2": 200.33196999999996, "r_x3": 436.73199000000005, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.94501, "r_y0": 227.23168999999996, "r_x1": 199.83374, "r_y1": 227.23168999999996, "r_x2": 199.83374, "r_y2": 219.16198999999995, "r_x3": 155.94501, "r_y3": 219.16198999999995, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 221.75171, "r_x1": 247.13226000000003, "r_y1": 221.75171, "r_x2": 247.13226000000003, "r_y2": 213.68201, "r_x3": 222.43700000000004, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 221.75171, "r_x1": 285.73074, "r_y1": 221.75171, "r_x2": 285.73074, "r_y2": 213.68201, "r_x3": 264.74399, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 221.75171, "r_x1": 323.43076, "r_y1": 221.75171, "r_x2": 323.43076, "r_y2": 213.68201, "r_x3": 302.444, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 221.54552999999999, "r_x1": 361.97586, "r_y1": 221.54552999999999, "r_x2": 361.97586, "r_y2": 213.61919999999998, "r_x3": 337.815, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 221.54552999999999, "r_x1": 404.62485, "r_y1": 221.54552999999999, "r_x2": 404.62485, "r_y2": 213.61919999999998, "r_x3": 380.46399, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 221.54552999999999, "r_x1": 454.35025, "r_y1": 221.54552999999999, "r_x2": 454.35025, "r_y2": 213.61919999999998, "r_x3": 435.49300999999997, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 234.70367, "r_x1": 248.66655999999998, "r_y1": 234.70367, "r_x2": 248.66655999999998, "r_y2": 226.63396999999998, "r_x3": 220.903, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 234.70367, "r_x1": 285.73074, "r_y1": 234.70367, "r_x2": 285.73074, "r_y2": 226.63396999999998, "r_x3": 264.74399, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 234.70367, "r_x1": 323.43076, "r_y1": 234.70367, "r_x2": 323.43076, "r_y2": 226.63396999999998, "r_x3": 302.444, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.70599, "r_y0": 234.70367, "r_x1": 358.08582, "r_y1": 234.70367, "r_x2": 358.08582, "r_y2": 226.63396999999998, "r_x3": 341.70599, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 234.70367, "r_x1": 403.03876, "r_y1": 234.70367, "r_x2": 403.03876, "r_y2": 226.63396999999998, "r_x3": 382.052, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 234.70367, "r_x1": 453.11182, "r_y1": 234.70367, "r_x2": 453.11182, "r_y2": 226.63396999999998, "r_x3": 436.73199000000005, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.62601, "r_y0": 253.53265, "r_x1": 207.1524, "r_y1": 253.53265, "r_x2": 207.1524, "r_y2": 245.46294999999998, "r_x3": 148.62601, "r_y3": 245.46294999999998, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 248.05267000000003, "r_x1": 247.13226000000003, "r_y1": 248.05267000000003, "r_x2": 247.13226000000003, "r_y2": 239.98297000000002, "r_x3": 222.43700000000004, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 248.05267000000003, "r_x1": 285.73074, "r_y1": 248.05267000000003, "r_x2": 285.73074, "r_y2": 239.98297000000002, "r_x3": 264.74399, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 248.05267000000003, "r_x1": 323.43076, "r_y1": 248.05267000000003, "r_x2": 323.43076, "r_y2": 239.98297000000002, "r_x3": 302.444, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 247.8465, "r_x1": 361.97586, "r_y1": 247.8465, "r_x2": 361.97586, "r_y2": 239.92016999999998, "r_x3": 337.815, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 247.8465, "r_x1": 404.62485, "r_y1": 247.8465, "r_x2": 404.62485, "r_y2": 239.92016999999998, "r_x3": 380.46399, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 247.8465, "r_x1": 454.35025, "r_y1": 247.8465, "r_x2": 454.35025, "r_y2": 239.92016999999998, "r_x3": 435.49300999999997, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 261.00469999999996, "r_x1": 248.66655999999998, "r_y1": 261.00469999999996, "r_x2": 248.66655999999998, "r_y2": 252.93499999999995, "r_x3": 220.903, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 261.00469999999996, "r_x1": 285.73074, "r_y1": 261.00469999999996, "r_x2": 285.73074, "r_y2": 252.93499999999995, "r_x3": 264.74399, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 261.00469999999996, "r_x1": 323.43076, "r_y1": 261.00469999999996, "r_x2": 323.43076, "r_y2": 252.93499999999995, "r_x3": 302.444, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 261.00469999999996, "r_x1": 360.38977, "r_y1": 261.00469999999996, "r_x2": 360.38977, "r_y2": 252.93499999999995, "r_x3": 339.40302, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 261.00469999999996, "r_x1": 403.03876, "r_y1": 261.00469999999996, "r_x2": 403.03876, "r_y2": 252.93499999999995, "r_x3": 382.052, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 261.00469999999996, "r_x1": 453.11182, "r_y1": 261.00469999999996, "r_x2": 453.11182, "r_y2": 252.93499999999995, "r_x3": 436.73199000000005, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 297.72173999999995, "r_x1": 149.40205, "r_y1": 297.72173999999995, "r_x2": 149.40205, "r_y2": 288.91479, "r_x3": 134.765, "r_y3": 288.91479, "coord_origin": "TOPLEFT" }, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 297.72173999999995, "r_x1": 257.08679, "r_y1": 297.72173999999995, "r_x2": 257.08679, "r_y2": 288.91479, "r_x3": 160.85904, "r_y3": 288.91479, "coord_origin": "TOPLEFT" }, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 318.65775, "r_x1": 480.58777, "r_y1": 318.65775, "r_x2": 480.58777, "r_y2": 309.86078, "r_x3": 134.765, "r_y3": 309.86078, "coord_origin": "TOPLEFT" }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "orig": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 330.61273, "r_x1": 480.58889999999997, "r_y1": 330.61273, "r_x2": 480.58889999999997, "r_y2": 321.81577, "r_x3": 134.765, "r_y3": 321.81577, "coord_origin": "TOPLEFT" }, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 342.56772, "r_x1": 480.58681999999993, "r_y1": 342.56772, "r_x2": 480.58681999999993, "r_y2": 333.77075, "r_x3": 134.765, "r_y3": 333.77075, "coord_origin": "TOPLEFT" }, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 354.52271, "r_x1": 480.58981, "r_y1": 354.52271, "r_x2": 480.58981, "r_y2": 345.72574, "r_x3": 134.765, "r_y3": 345.72574, "coord_origin": "TOPLEFT" }, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 366.47769, "r_x1": 161.65704, "r_y1": 366.47769, "r_x2": 161.65704, "r_y2": 357.68073, "r_x3": 134.765, "r_y3": 357.68073, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 405.51642, "r_x1": 162.64424, "r_y1": 405.51642, "r_x2": 162.64424, "r_y2": 397.59012, "r_x3": 134.765, "r_y3": 397.59012, "coord_origin": "TOPLEFT" }, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.384, "r_y0": 405.72266, "r_x1": 480.59106, "r_y1": 405.72266, "r_x2": 480.59106, "r_y2": 397.65289, "r_x3": 167.384, "r_y3": 397.65289, "coord_origin": "TOPLEFT" }, "text": "The OTSL model produces more accurate bounding boxes with less over-", "orig": "The OTSL model produces more accurate bounding boxes with less over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 416.68167000000005, "r_x1": 480.59106, "r_y1": 416.68167000000005, "r_x2": 480.59106, "r_y2": 408.61190999999997, "r_x3": 134.765, "r_y3": 408.61190999999997, "coord_origin": "TOPLEFT" }, "text": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 427.64066, "r_x1": 480.58838000000003, "r_y1": 427.64066, "r_x2": 480.58838000000003, "r_y2": 419.57089, "r_x3": 134.765, "r_y3": 419.57089, "coord_origin": "TOPLEFT" }, "text": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "orig": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 438.59964, "r_x1": 304.69171, "r_y1": 438.59964, "r_x2": 304.69171, "r_y2": 430.52987999999993, "r_x3": 134.765, "r_y3": 430.52987999999993, "coord_origin": "TOPLEFT" }, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 518.94992, "r_x1": 190.62042, "r_y1": 518.94992, "r_x2": 190.62042, "r_y2": 516.2332200000001, "r_x3": 180.12473, "r_y3": 516.2332200000001, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 522.84879, "r_x1": 304.54797, "r_y1": 522.84879, "r_x2": 304.54797, "r_y2": 520.13208, "r_x3": 183.2438, "r_y3": 520.13208, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 526.74765, "r_x1": 388.42313, "r_y1": 526.74765, "r_x2": 388.42313, "r_y2": 524.03094, "r_x3": 183.2438, "r_y3": 524.03094, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 530.64648, "r_x1": 388.42313, "r_y1": 530.64648, "r_x2": 388.42313, "r_y2": 527.9297799999999, "r_x3": 183.2438, "r_y3": 527.9297799999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 534.54532, "r_x1": 388.42313, "r_y1": 534.54532, "r_x2": 388.42313, "r_y2": 531.82861, "r_x3": 183.2438, "r_y3": 531.82861, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 538.44418, "r_x1": 388.42313, "r_y1": 538.44418, "r_x2": 388.42313, "r_y2": 535.72748, "r_x3": 183.2438, "r_y3": 535.72748, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 542.34303, "r_x1": 388.42313, "r_y1": 542.34303, "r_x2": 388.42313, "r_y2": 539.62631, "r_x3": 183.2438, "r_y3": 539.62631, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 546.24188, "r_x1": 388.42313, "r_y1": 546.24188, "r_x2": 388.42313, "r_y2": 543.52516, "r_x3": 183.2438, "r_y3": 543.52516, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 550.14073, "r_x1": 388.42313, "r_y1": 550.14073, "r_x2": 388.42313, "r_y2": 547.42401, "r_x3": 183.2438, "r_y3": 547.42401, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 554.03958, "r_x1": 388.42313, "r_y1": 554.03958, "r_x2": 388.42313, "r_y2": 551.32286, "r_x3": 183.2438, "r_y3": 551.32286, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 557.93845, "r_x1": 191.86806, "r_y1": 557.93845, "r_x2": 191.86806, "r_y2": 555.22173, "r_x3": 180.12473, "r_y3": 555.22173, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 521.01712, "r_x1": 408.82025, "r_y1": 521.01712, "r_x2": 408.82025, "r_y2": 518.30042, "r_x3": 407.38348, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 521.01712, "r_x1": 450.48605, "r_y1": 521.01712, "r_x2": 450.48605, "r_y2": 518.30042, "r_x3": 410.25699, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 524.9159500000001, "r_x1": 408.82025, "r_y1": 524.9159500000001, "r_x2": 408.82025, "r_y2": 522.19925, "r_x3": 407.38348, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 524.9159500000001, "r_x1": 450.48605, "r_y1": 524.9159500000001, "r_x2": 450.48605, "r_y2": 522.19925, "r_x3": 410.25699, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 528.81479, "r_x1": 408.82025, "r_y1": 528.81479, "r_x2": 408.82025, "r_y2": 526.09808, "r_x3": 407.38348, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 528.81479, "r_x1": 450.48605, "r_y1": 528.81479, "r_x2": 450.48605, "r_y2": 526.09808, "r_x3": 410.25699, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 532.7136499999999, "r_x1": 408.82025, "r_y1": 532.7136499999999, "r_x2": 408.82025, "r_y2": 529.99695, "r_x3": 407.38348, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 532.7136499999999, "r_x1": 450.48605, "r_y1": 532.7136499999999, "r_x2": 450.48605, "r_y2": 529.99695, "r_x3": 410.25699, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 536.6125, "r_x1": 408.82025, "r_y1": 536.6125, "r_x2": 408.82025, "r_y2": 533.8957800000001, "r_x3": 407.38348, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 536.6125, "r_x1": 450.48605, "r_y1": 536.6125, "r_x2": 450.48605, "r_y2": 533.8957800000001, "r_x3": 410.25699, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 540.51135, "r_x1": 408.82025, "r_y1": 540.51135, "r_x2": 408.82025, "r_y2": 537.79463, "r_x3": 407.38348, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 540.51135, "r_x1": 450.48605, "r_y1": 540.51135, "r_x2": 450.48605, "r_y2": 537.79463, "r_x3": 410.25699, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 544.4102, "r_x1": 408.82025, "r_y1": 544.4102, "r_x2": 408.82025, "r_y2": 541.69348, "r_x3": 407.38348, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 544.4102, "r_x1": 450.48605, "r_y1": 544.4102, "r_x2": 450.48605, "r_y2": 541.69348, "r_x3": 410.25699, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 548.3090500000001, "r_x1": 408.82025, "r_y1": 548.3090500000001, "r_x2": 408.82025, "r_y2": 545.59233, "r_x3": 407.38348, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 548.3090500000001, "r_x1": 450.48605, "r_y1": 548.3090500000001, "r_x2": 450.48605, "r_y2": 545.59233, "r_x3": 410.25699, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 552.2079200000001, "r_x1": 408.82025, "r_y1": 552.2079200000001, "r_x2": 408.82025, "r_y2": 549.4911999999999, "r_x3": 407.38348, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 552.2079200000001, "r_x1": 450.48605, "r_y1": 552.2079200000001, "r_x2": 450.48605, "r_y2": 549.4911999999999, "r_x3": 410.25699, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.52881, "r_y0": 515.31, "r_x1": 181.8528, "r_y1": 515.31, "r_x2": 181.8528, "r_y2": 509.45859, "r_x3": 164.52881, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58441, "r_y0": 515.31, "r_x1": 186.3974, "r_y1": 515.31, "r_x2": 186.3974, "r_y2": 509.45859, "r_x3": 183.58441, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2104, "r_y0": 515.31, "r_x1": 208.90137, "r_y1": 515.31, "r_x2": 208.90137, "r_y2": 509.45859, "r_x3": 189.2104, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63269, "r_y0": 515.31, "r_x1": 221.04044, "r_y1": 515.31, "r_x2": 221.04044, "r_y2": 509.45859, "r_x3": 210.63269, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.20203, "r_y0": 515.45502, "r_x1": 406.83609, "r_y1": 515.45502, "r_x2": 406.83609, "r_y2": 509.60361, "r_x3": 390.20203, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.56952, "r_y0": 515.45502, "r_x1": 411.38251, "r_y1": 515.45502, "r_x2": 411.38251, "r_y2": 509.60361, "r_x3": 408.56952, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.1955, "r_y0": 515.45502, "r_x1": 433.88647000000003, "r_y1": 515.45502, "r_x2": 433.88647000000003, "r_y2": 509.60361, "r_x3": 414.1955, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61737, "r_y0": 515.45502, "r_x1": 446.02512, "r_y1": 515.45502, "r_x2": 446.02512, "r_y2": 509.60361, "r_x3": 435.61737, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19316, "r_y0": 526.3866, "r_x1": 172.8231, "r_y1": 526.3866, "r_x2": 172.8231, "r_y2": 519.07236, "r_x3": 167.19316, "r_y3": 519.07236, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.33745, "r_y0": 455.93909, "r_x1": 192.96739, "r_y1": 455.93909, "r_x2": 192.96739, "r_y2": 448.62485, "r_x3": 187.33745, "r_y3": 448.62485, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.38654, "r_y0": 573.3194, "r_x1": 173.01648, "r_y1": 573.3194, "r_x2": 173.01648, "r_y2": 566.0051599999999, "r_x3": 167.38654, "r_y3": 566.0051599999999, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.45621000000003, "r_y0": 629.09431, "r_x1": 253.65727, "r_y1": 629.09431, "r_x2": 253.65727, "r_y2": 621.78008, "r_x3": 248.45621000000003, "r_y3": 621.78008, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.90057, "r_y0": 526.5137, "r_x1": 401.53052, "r_y1": 526.5137, "r_x2": 401.53052, "r_y2": 519.19946, "r_x3": 395.90057, "r_y3": 519.19946, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.62886, "r_y0": 597.26784, "r_x1": 177.48148, "r_y1": 597.26784, "r_x2": 177.48148, "r_y2": 580.28853, "r_x3": 171.62886, "r_y3": 580.28853, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.05969000000002, "r_y0": 649.92345, "r_x1": 256.91235, "r_y1": 649.92345, "r_x2": 256.91235, "r_y2": 633.63408, "r_x3": 251.05969000000002, "r_y3": 633.63408, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 607.30864, "r_x1": 427.0379, "r_y1": 607.30864, "r_x2": 427.0379, "r_y2": 601.45724, "r_x3": 372.14645, "r_y3": 601.45724, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 613.75087, "r_x1": 430.06838999999997, "r_y1": 613.75087, "r_x2": 430.06838999999997, "r_y2": 607.89948, "r_x3": 372.14645, "r_y3": 607.89948, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 648.72348, "r_x1": 231.08191, "r_y1": 648.72348, "r_x2": 231.08191, "r_y2": 642.87209, "r_x3": 176.88042, "r_y3": 642.87209, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 655.1657, "r_x1": 230.99271000000002, "r_y1": 655.1657, "r_x2": 230.99271000000002, "r_y2": 649.3143, "r_x3": 176.88042, "r_y3": 649.3143, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 661.60794, "r_x1": 203.93219, "r_y1": 661.60794, "r_x2": 203.93219, "r_y2": 655.7565500000001, "r_x3": 176.88042, "r_y3": 655.7565500000001, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93231000000003, "r_y0": 569.15967, "r_x1": 218.4697, "r_y1": 569.15967, "r_x2": 218.4697, "r_y2": 557.56342, "r_x3": 215.93231000000003, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.05689999999998, "r_y0": 569.15967, "r_x1": 231.71908999999997, "r_y1": 569.15967, "r_x2": 231.71908999999997, "r_y2": 557.56342, "r_x3": 229.05689999999998, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 342.63354, "r_y0": 439.71716, "r_x1": 344.81915, "r_y1": 439.71716, "r_x2": 344.81915, "r_y2": 430.19678, "r_x3": 342.63354, "r_y3": 430.19678, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.20892, "r_y0": 451.19727, "r_x1": 263.56973, "r_y1": 451.19727, "r_x2": 263.56973, "r_y2": 448.46124, "r_x3": 261.20892, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33463, "r_y0": 451.19727, "r_x1": 313.6362, "r_y1": 451.19727, "r_x2": 313.6362, "r_y2": 448.46124, "r_x3": 312.33463, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41125, "r_y0": 451.19727, "r_x1": 380.05737, "r_y1": 451.19727, "r_x2": 380.05737, "r_y2": 448.46124, "r_x3": 377.41125, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63976, "r_y0": 456.07599, "r_x1": 205.82492, "r_y1": 456.07599, "r_x2": 205.82492, "r_y2": 453.33997, "r_x3": 200.63976, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.20833000000002, "r_y0": 456.07599, "r_x1": 229.76836, "r_y1": 456.07599, "r_x2": 229.76836, "r_y2": 453.33997, "r_x3": 222.20833000000002, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26666, "r_y0": 456.07599, "r_x1": 250.82669, "r_y1": 456.07599, "r_x2": 250.82669, "r_y2": 453.33997, "r_x3": 243.26666, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29657, "r_y0": 456.07599, "r_x1": 271.84949, "r_y1": 456.07599, "r_x2": 271.84949, "r_y2": 453.33997, "r_x3": 264.29657, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.31943, "r_y0": 456.07599, "r_x1": 292.87946, "r_y1": 456.07599, "r_x2": 292.87946, "r_y2": 453.33997, "r_x3": 285.31943, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37775, "r_y0": 456.07599, "r_x1": 311.77319, "r_y1": 456.07599, "r_x2": 311.77319, "r_y2": 453.33997, "r_x3": 306.37775, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.41699, "r_y0": 456.07599, "r_x1": 325.58157, "r_y1": 456.07599, "r_x2": 325.58157, "r_y2": 453.33997, "r_x3": 323.41699, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.45807, "r_y0": 456.07599, "r_x1": 336.62265, "r_y1": 456.07599, "r_x2": 336.62265, "r_y2": 453.33997, "r_x3": 334.45807, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52756, "r_y0": 456.07599, "r_x1": 347.69214, "r_y1": 456.07599, "r_x2": 347.69214, "r_y2": 453.33997, "r_x3": 345.52756, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56863, "r_y0": 456.07599, "r_x1": 358.73322, "r_y1": 456.07599, "r_x2": 358.73322, "r_y2": 453.33997, "r_x3": 356.56863, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63812, "r_y0": 456.07599, "r_x1": 371.97089, "r_y1": 456.07599, "r_x2": 371.97089, "r_y2": 453.33997, "r_x3": 367.63812, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.6734, "r_y0": 456.07599, "r_x1": 387.00616, "r_y1": 456.07599, "r_x2": 387.00616, "r_y2": 453.33997, "r_x3": 382.6734, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73727, "r_y0": 456.07599, "r_x1": 402.07001, "r_y1": 456.07599, "r_x2": 402.07001, "r_y2": 453.33997, "r_x3": 397.73727, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78879, "r_y0": 457.79964999999993, "r_x1": 414.93463, "r_y1": 457.79964999999993, "r_x2": 414.93463, "r_y2": 447.99298, "r_x3": 412.78879, "r_y3": 447.99298, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.95697, "r_y0": 456.07599, "r_x1": 422.51746, "r_y1": 456.07599, "r_x2": 422.51746, "r_y2": 453.33997, "r_x3": 414.95697, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63998, "r_y0": 466.66043, "r_x1": 204.57674, "r_y1": 466.66043, "r_x2": 204.57674, "r_y2": 463.92444, "r_x3": 200.63998, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62604, "r_y0": 466.66043, "r_x1": 369.58032, "r_y1": 466.66043, "r_x2": 369.58032, "r_y2": 463.92444, "r_x3": 367.62604, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 466.66043, "r_x1": 384.6156, "r_y1": 466.66043, "r_x2": 384.6156, "r_y2": 463.92444, "r_x3": 382.66132, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72504, "r_y0": 466.66043, "r_x1": 399.67932, "r_y1": 466.66043, "r_x2": 399.67932, "r_y2": 463.92444, "r_x3": 397.72504, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.53915, "r_x1": 206.51694, "r_y1": 471.53915, "r_x2": 206.51694, "r_y2": 468.80313, "r_x3": 200.64, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 471.53915, "r_x1": 266.25885, "r_y1": 471.53915, "r_x2": 266.25885, "r_y2": 468.80313, "r_x3": 264.29047, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37213, "r_y0": 471.53915, "r_x1": 308.34052, "r_y1": 471.53915, "r_x2": 308.34052, "r_y2": 468.80313, "r_x3": 306.37213, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.51526, "r_y0": 471.53915, "r_x1": 347.48364, "r_y1": 471.53915, "r_x2": 347.48364, "r_y2": 468.80313, "r_x3": 345.51526, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.55634, "r_y0": 471.53915, "r_x1": 358.52472, "r_y1": 471.53915, "r_x2": 358.52472, "r_y2": 468.80313, "r_x3": 356.55634, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62582, "r_y0": 471.53915, "r_x1": 369.59418, "r_y1": 471.53915, "r_x2": 369.59418, "r_y2": 468.80313, "r_x3": 367.62582, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66107, "r_y0": 471.53915, "r_x1": 384.62946, "r_y1": 471.53915, "r_x2": 384.62946, "r_y2": 468.80313, "r_x3": 382.66107, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.41788, "r_x1": 206.51694, "r_y1": 476.41788, "r_x2": 206.51694, "r_y2": 473.68185, "r_x3": 200.64, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 476.41788, "r_x1": 266.25885, "r_y1": 476.41788, "r_x2": 266.25885, "r_y2": 473.68185, "r_x3": 264.29047, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.26816, "r_x1": 206.51694, "r_y1": 481.26816, "r_x2": 206.51694, "r_y2": 478.53214, "r_x3": 200.64, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26373, "r_y0": 481.26816, "r_x1": 245.2321, "r_y1": 481.26816, "r_x2": 245.2321, "r_y2": 478.53214, "r_x3": 243.26373, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 481.26816, "r_x1": 266.25885, "r_y1": 481.26816, "r_x2": 266.25885, "r_y2": 478.53214, "r_x3": 264.29047, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.40466, "r_y0": 481.26816, "r_x1": 325.37305, "r_y1": 481.26816, "r_x2": 325.37305, "r_y2": 478.53214, "r_x3": 323.40466, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72519, "r_y0": 481.26816, "r_x1": 399.69354, "r_y1": 481.26816, "r_x2": 399.69354, "r_y2": 478.53214, "r_x3": 397.72519, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.14688, "r_x1": 206.51694, "r_y1": 486.14688, "r_x2": 206.51694, "r_y2": 483.41086, "r_x3": 200.64, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 486.14688, "r_x1": 384.61563, "r_y1": 486.14688, "r_x2": 384.61563, "r_y2": 483.41086, "r_x3": 382.66132, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72513, "r_y0": 486.14688, "r_x1": 401.64819, "r_y1": 486.14688, "r_x2": 401.64819, "r_y2": 483.41086, "r_x3": 397.72513, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78928, "r_y0": 486.14688, "r_x1": 414.74359, "r_y1": 486.14688, "r_x2": 414.74359, "r_y2": 483.41086, "r_x3": 412.78928, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64014, "r_y0": 491.0256, "r_x1": 207.14445, "r_y1": 491.0256, "r_x2": 207.14445, "r_y2": 488.28958, "r_x3": 200.64014, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62616, "r_y0": 491.0256, "r_x1": 369.78375, "r_y1": 491.0256, "r_x2": 369.78375, "r_y2": 488.28958, "r_x3": 367.62616, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66141, "r_y0": 491.0256, "r_x1": 384.81897, "r_y1": 491.0256, "r_x2": 384.81897, "r_y2": 488.28958, "r_x3": 382.66141, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7251, "r_y0": 491.0256, "r_x1": 402.05087, "r_y1": 491.0256, "r_x2": 402.05087, "r_y2": 488.28958, "r_x3": 397.7251, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64032, "r_y0": 495.90433, "r_x1": 208.48566, "r_y1": 495.90433, "r_x2": 208.48566, "r_y2": 493.1683, "r_x3": 200.64032, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29044, "r_y0": 495.90433, "r_x1": 266.25879, "r_y1": 495.90433, "r_x2": 266.25879, "r_y2": 493.1683, "r_x3": 264.29044, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.91466, "r_y0": 675.3464, "r_x1": 230.10028, "r_y1": 675.3464, "r_x2": 230.10028, "r_y2": 665.82603, "r_x3": 227.91466, "r_y3": 665.82603, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.58057, "r_y0": 693.428658, "r_x1": 302.72638, "r_y1": 693.428658, "r_x2": 302.72638, "r_y2": 683.62195, "r_x3": 300.58057, "r_y3": 683.62195, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 7, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 143.97887, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8309906721115112, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 143.97887, "r_y1": 101.84069999999997, "r_x2": 143.97887, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 167.82053, "t": 93.77099999999996, "r": 231.72049000000004, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8367075324058533, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82053, "r_y0": 101.84069999999997, "r_x1": 178.08249, "r_y1": 101.84069999999997, "r_x2": 178.08249, "r_y2": 93.77099999999996, "r_x3": 167.82053, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37929, "r_y0": 101.84069999999997, "r_x1": 231.72049000000004, "r_y1": 101.84069999999997, "r_x2": 231.72049000000004, "r_y2": 93.77099999999996, "r_x3": 182.37929, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "caption", "bbox": { "l": 134.765, "t": 115.83618000000001, "r": 480.59357000000006, "b": 145.88666, "coord_origin": "TOPLEFT" }, "confidence": 0.9512290954589844, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 123.76251000000002, "r_x1": 173.09366, "r_y1": 123.76251000000002, "r_x2": 173.09366, "r_y2": 115.83618000000001, "r_x3": 134.765, "r_y3": 115.83618000000001, "coord_origin": "TOPLEFT" }, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.30299, "r_y0": 123.96868999999992, "r_x1": 480.59151999999995, "r_y1": 123.96868999999992, "r_x2": 480.59151999999995, "r_y2": 115.89899000000003, "r_x3": 181.30299, "r_y3": 115.89899000000003, "coord_origin": "TOPLEFT" }, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 134.92767000000003, "r_x1": 480.59357000000006, "r_y1": 134.92767000000003, "r_x2": 480.59357000000006, "r_y2": 126.85797000000014, "r_x3": 134.765, "r_y3": 126.85797000000014, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 145.88666, "r_x1": 305.95691, "r_y1": 145.88666, "r_x2": 305.95691, "r_y2": 137.81696, "r_x3": 134.765, "r_y3": 137.81696, "coord_origin": "TOPLEFT" }, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "table", "bbox": { "l": 143.6376495361328, "t": 156.3477020263672, "r": 470.8485412597656, "b": 263.2624816894531, "coord_origin": "TOPLEFT" }, "confidence": 0.9884640574455261, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.782, "r_y0": 174.62865999999997, "r_x1": 194.99779, "r_y1": 174.62865999999997, "r_x2": 194.99779, "r_y2": 166.55895999999996, "r_x3": 160.782, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52499000000003, "r_y0": 174.6037, "r_x1": 254.04465, "r_y1": 174.6037, "r_x2": 254.04465, "r_y2": 166.534, "r_x3": 215.52499000000003, "r_y3": 166.534, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.397, "r_y0": 169.14868, "r_x1": 323.99118, "r_y1": 169.14868, "r_x2": 323.99118, "r_y2": 161.07898, "r_x3": 300.397, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.345, "r_y0": 174.62865999999997, "r_x1": 414.74661, "r_y1": 174.62865999999997, "r_x2": 414.74661, "r_y2": 166.55895999999996, "r_x3": 370.345, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.737, "r_y0": 169.14868, "r_x1": 463.10830999999996, "r_y1": 169.14868, "r_x2": 463.10830999999996, "r_y2": 161.07898, "r_x3": 426.737, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11401, "r_y0": 180.10766999999998, "r_x1": 466.72656, "r_y1": 180.10766999999998, "r_x2": 466.72656, "r_y2": 172.03796, "r_x3": 423.11401, "r_y3": 172.03796, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41299, "r_y0": 182.10071000000005, "r_x1": 288.0596, "r_y1": 182.10071000000005, "r_x2": 288.0596, "r_y2": 174.03101000000004, "r_x3": 262.41299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.42899, "r_y0": 182.10071000000005, "r_x1": 329.44687, "r_y1": 182.10071000000005, "r_x2": 329.44687, "r_y2": 174.03101000000004, "r_x3": 296.42899, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03299, "r_y0": 182.10071000000005, "r_x1": 354.75793, "r_y1": 182.10071000000005, "r_x2": 354.75793, "r_y2": 174.03101000000004, "r_x3": 345.03299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.53799, "r_y0": 200.92969000000005, "r_x1": 201.24129, "r_y1": 200.92969000000005, "r_x2": 201.24129, "r_y2": 192.85999000000004, "r_x3": 154.53799, "r_y3": 192.85999000000004, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 195.45068000000003, "r_x1": 247.13226000000003, "r_y1": 195.45068000000003, "r_x2": 247.13226000000003, "r_y2": 187.38098000000002, "r_x3": 222.43700000000004, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 195.45068000000003, "r_x1": 285.73074, "r_y1": 195.45068000000003, "r_x2": 285.73074, "r_y2": 187.38098000000002, "r_x3": 264.74399, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 195.45068000000003, "r_x1": 323.43076, "r_y1": 195.45068000000003, "r_x2": 323.43076, "r_y2": 187.38098000000002, "r_x3": 302.444, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 195.45068000000003, "r_x1": 360.38977, "r_y1": 195.45068000000003, "r_x2": 360.38977, "r_y2": 187.38098000000002, "r_x3": 339.40302, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.116, "r_y0": 195.24451, "r_x1": 401.97324, "r_y1": 195.24451, "r_x2": 401.97324, "r_y2": 187.31817999999998, "r_x3": 383.116, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 195.24451, "r_x1": 454.35025, "r_y1": 195.24451, "r_x2": 454.35025, "r_y2": 187.31817999999998, "r_x3": 435.49300999999997, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 208.40166999999997, "r_x1": 248.66655999999998, "r_y1": 208.40166999999997, "r_x2": 248.66655999999998, "r_y2": 200.33196999999996, "r_x3": 220.903, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 208.40166999999997, "r_x1": 285.73074, "r_y1": 208.40166999999997, "r_x2": 285.73074, "r_y2": 200.33196999999996, "r_x3": 264.74399, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 208.40166999999997, "r_x1": 323.43076, "r_y1": 208.40166999999997, "r_x2": 323.43076, "r_y2": 200.33196999999996, "r_x3": 302.444, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 208.40166999999997, "r_x1": 360.38977, "r_y1": 208.40166999999997, "r_x2": 360.38977, "r_y2": 200.33196999999996, "r_x3": 339.40302, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 208.40166999999997, "r_x1": 403.03876, "r_y1": 208.40166999999997, "r_x2": 403.03876, "r_y2": 200.33196999999996, "r_x3": 382.052, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 208.40166999999997, "r_x1": 453.11182, "r_y1": 208.40166999999997, "r_x2": 453.11182, "r_y2": 200.33196999999996, "r_x3": 436.73199000000005, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.94501, "r_y0": 227.23168999999996, "r_x1": 199.83374, "r_y1": 227.23168999999996, "r_x2": 199.83374, "r_y2": 219.16198999999995, "r_x3": 155.94501, "r_y3": 219.16198999999995, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 221.75171, "r_x1": 247.13226000000003, "r_y1": 221.75171, "r_x2": 247.13226000000003, "r_y2": 213.68201, "r_x3": 222.43700000000004, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 221.75171, "r_x1": 285.73074, "r_y1": 221.75171, "r_x2": 285.73074, "r_y2": 213.68201, "r_x3": 264.74399, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 221.75171, "r_x1": 323.43076, "r_y1": 221.75171, "r_x2": 323.43076, "r_y2": 213.68201, "r_x3": 302.444, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 221.54552999999999, "r_x1": 361.97586, "r_y1": 221.54552999999999, "r_x2": 361.97586, "r_y2": 213.61919999999998, "r_x3": 337.815, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 221.54552999999999, "r_x1": 404.62485, "r_y1": 221.54552999999999, "r_x2": 404.62485, "r_y2": 213.61919999999998, "r_x3": 380.46399, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 221.54552999999999, "r_x1": 454.35025, "r_y1": 221.54552999999999, "r_x2": 454.35025, "r_y2": 213.61919999999998, "r_x3": 435.49300999999997, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 234.70367, "r_x1": 248.66655999999998, "r_y1": 234.70367, "r_x2": 248.66655999999998, "r_y2": 226.63396999999998, "r_x3": 220.903, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 234.70367, "r_x1": 285.73074, "r_y1": 234.70367, "r_x2": 285.73074, "r_y2": 226.63396999999998, "r_x3": 264.74399, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 234.70367, "r_x1": 323.43076, "r_y1": 234.70367, "r_x2": 323.43076, "r_y2": 226.63396999999998, "r_x3": 302.444, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.70599, "r_y0": 234.70367, "r_x1": 358.08582, "r_y1": 234.70367, "r_x2": 358.08582, "r_y2": 226.63396999999998, "r_x3": 341.70599, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 234.70367, "r_x1": 403.03876, "r_y1": 234.70367, "r_x2": 403.03876, "r_y2": 226.63396999999998, "r_x3": 382.052, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 234.70367, "r_x1": 453.11182, "r_y1": 234.70367, "r_x2": 453.11182, "r_y2": 226.63396999999998, "r_x3": 436.73199000000005, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.62601, "r_y0": 253.53265, "r_x1": 207.1524, "r_y1": 253.53265, "r_x2": 207.1524, "r_y2": 245.46294999999998, "r_x3": 148.62601, "r_y3": 245.46294999999998, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 248.05267000000003, "r_x1": 247.13226000000003, "r_y1": 248.05267000000003, "r_x2": 247.13226000000003, "r_y2": 239.98297000000002, "r_x3": 222.43700000000004, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 248.05267000000003, "r_x1": 285.73074, "r_y1": 248.05267000000003, "r_x2": 285.73074, "r_y2": 239.98297000000002, "r_x3": 264.74399, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 248.05267000000003, "r_x1": 323.43076, "r_y1": 248.05267000000003, "r_x2": 323.43076, "r_y2": 239.98297000000002, "r_x3": 302.444, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 247.8465, "r_x1": 361.97586, "r_y1": 247.8465, "r_x2": 361.97586, "r_y2": 239.92016999999998, "r_x3": 337.815, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 247.8465, "r_x1": 404.62485, "r_y1": 247.8465, "r_x2": 404.62485, "r_y2": 239.92016999999998, "r_x3": 380.46399, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 247.8465, "r_x1": 454.35025, "r_y1": 247.8465, "r_x2": 454.35025, "r_y2": 239.92016999999998, "r_x3": 435.49300999999997, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 261.00469999999996, "r_x1": 248.66655999999998, "r_y1": 261.00469999999996, "r_x2": 248.66655999999998, "r_y2": 252.93499999999995, "r_x3": 220.903, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 261.00469999999996, "r_x1": 285.73074, "r_y1": 261.00469999999996, "r_x2": 285.73074, "r_y2": 252.93499999999995, "r_x3": 264.74399, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 261.00469999999996, "r_x1": 323.43076, "r_y1": 261.00469999999996, "r_x2": 323.43076, "r_y2": 252.93499999999995, "r_x3": 302.444, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 261.00469999999996, "r_x1": 360.38977, "r_y1": 261.00469999999996, "r_x2": 360.38977, "r_y2": 252.93499999999995, "r_x3": 339.40302, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 261.00469999999996, "r_x1": 403.03876, "r_y1": 261.00469999999996, "r_x2": 403.03876, "r_y2": 252.93499999999995, "r_x3": 382.052, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 261.00469999999996, "r_x1": 453.11182, "r_y1": 261.00469999999996, "r_x2": 453.11182, "r_y2": 252.93499999999995, "r_x3": 436.73199000000005, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 10, "label": "text", "bbox": { "l": 160.782, "t": 166.55895999999996, "r": 194.99779, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.782, "r_y0": 174.62865999999997, "r_x1": 194.99779, "r_y1": 174.62865999999997, "r_x2": 194.99779, "r_y2": 166.55895999999996, "r_x3": 160.782, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 215.52499000000003, "t": 166.534, "r": 254.04465, "b": 174.6037, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52499000000003, "r_y0": 174.6037, "r_x1": 254.04465, "r_y1": 174.6037, "r_x2": 254.04465, "r_y2": 166.534, "r_x3": 215.52499000000003, "r_y3": 166.534, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 300.397, "t": 161.07898, "r": 323.99118, "b": 169.14868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.397, "r_y0": 169.14868, "r_x1": 323.99118, "r_y1": 169.14868, "r_x2": 323.99118, "r_y2": 161.07898, "r_x3": 300.397, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 370.345, "t": 166.55895999999996, "r": 414.74661, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.345, "r_y0": 174.62865999999997, "r_x1": 414.74661, "r_y1": 174.62865999999997, "r_x2": 414.74661, "r_y2": 166.55895999999996, "r_x3": 370.345, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 426.737, "t": 161.07898, "r": 463.10830999999996, "b": 169.14868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.737, "r_y0": 169.14868, "r_x1": 463.10830999999996, "r_y1": 169.14868, "r_x2": 463.10830999999996, "r_y2": 161.07898, "r_x3": 426.737, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 423.11401, "t": 172.03796, "r": 466.72656, "b": 180.10766999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11401, "r_y0": 180.10766999999998, "r_x1": 466.72656, "r_y1": 180.10766999999998, "r_x2": 466.72656, "r_y2": 172.03796, "r_x3": 423.11401, "r_y3": 172.03796, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 262.41299, "t": 174.03101000000004, "r": 288.0596, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41299, "r_y0": 182.10071000000005, "r_x1": 288.0596, "r_y1": 182.10071000000005, "r_x2": 288.0596, "r_y2": 174.03101000000004, "r_x3": 262.41299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 296.42899, "t": 174.03101000000004, "r": 329.44687, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.42899, "r_y0": 182.10071000000005, "r_x1": 329.44687, "r_y1": 182.10071000000005, "r_x2": 329.44687, "r_y2": 174.03101000000004, "r_x3": 296.42899, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 345.03299, "t": 174.03101000000004, "r": 354.75793, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03299, "r_y0": 182.10071000000005, "r_x1": 354.75793, "r_y1": 182.10071000000005, "r_x2": 354.75793, "r_y2": 174.03101000000004, "r_x3": 345.03299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 154.53799, "t": 192.85999000000004, "r": 201.24129, "b": 200.92969000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.53799, "r_y0": 200.92969000000005, "r_x1": 201.24129, "r_y1": 200.92969000000005, "r_x2": 201.24129, "r_y2": 192.85999000000004, "r_x3": 154.53799, "r_y3": 192.85999000000004, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 222.43700000000004, "t": 187.38098000000002, "r": 247.13226000000003, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 195.45068000000003, "r_x1": 247.13226000000003, "r_y1": 195.45068000000003, "r_x2": 247.13226000000003, "r_y2": 187.38098000000002, "r_x3": 222.43700000000004, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 264.74399, "t": 187.38098000000002, "r": 285.73074, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 195.45068000000003, "r_x1": 285.73074, "r_y1": 195.45068000000003, "r_x2": 285.73074, "r_y2": 187.38098000000002, "r_x3": 264.74399, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 302.444, "t": 187.38098000000002, "r": 323.43076, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 195.45068000000003, "r_x1": 323.43076, "r_y1": 195.45068000000003, "r_x2": 323.43076, "r_y2": 187.38098000000002, "r_x3": 302.444, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 339.40302, "t": 187.38098000000002, "r": 360.38977, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 195.45068000000003, "r_x1": 360.38977, "r_y1": 195.45068000000003, "r_x2": 360.38977, "r_y2": 187.38098000000002, "r_x3": 339.40302, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 383.116, "t": 187.31817999999998, "r": 401.97324, "b": 195.24451, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.116, "r_y0": 195.24451, "r_x1": 401.97324, "r_y1": 195.24451, "r_x2": 401.97324, "r_y2": 187.31817999999998, "r_x3": 383.116, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 435.49300999999997, "t": 187.31817999999998, "r": 454.35025, "b": 195.24451, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 195.24451, "r_x1": 454.35025, "r_y1": 195.24451, "r_x2": 454.35025, "r_y2": 187.31817999999998, "r_x3": 435.49300999999997, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 220.903, "t": 200.33196999999996, "r": 248.66655999999998, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 208.40166999999997, "r_x1": 248.66655999999998, "r_y1": 208.40166999999997, "r_x2": 248.66655999999998, "r_y2": 200.33196999999996, "r_x3": 220.903, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 264.74399, "t": 200.33196999999996, "r": 285.73074, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 208.40166999999997, "r_x1": 285.73074, "r_y1": 208.40166999999997, "r_x2": 285.73074, "r_y2": 200.33196999999996, "r_x3": 264.74399, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 302.444, "t": 200.33196999999996, "r": 323.43076, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 208.40166999999997, "r_x1": 323.43076, "r_y1": 208.40166999999997, "r_x2": 323.43076, "r_y2": 200.33196999999996, "r_x3": 302.444, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 339.40302, "t": 200.33196999999996, "r": 360.38977, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 208.40166999999997, "r_x1": 360.38977, "r_y1": 208.40166999999997, "r_x2": 360.38977, "r_y2": 200.33196999999996, "r_x3": 339.40302, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 382.052, "t": 200.33196999999996, "r": 403.03876, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 208.40166999999997, "r_x1": 403.03876, "r_y1": 208.40166999999997, "r_x2": 403.03876, "r_y2": 200.33196999999996, "r_x3": 382.052, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 436.73199000000005, "t": 200.33196999999996, "r": 453.11182, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 208.40166999999997, "r_x1": 453.11182, "r_y1": 208.40166999999997, "r_x2": 453.11182, "r_y2": 200.33196999999996, "r_x3": 436.73199000000005, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 155.94501, "t": 219.16198999999995, "r": 199.83374, "b": 227.23168999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.94501, "r_y0": 227.23168999999996, "r_x1": 199.83374, "r_y1": 227.23168999999996, "r_x2": 199.83374, "r_y2": 219.16198999999995, "r_x3": 155.94501, "r_y3": 219.16198999999995, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 222.43700000000004, "t": 213.68201, "r": 247.13226000000003, "b": 221.75171, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 221.75171, "r_x1": 247.13226000000003, "r_y1": 221.75171, "r_x2": 247.13226000000003, "r_y2": 213.68201, "r_x3": 222.43700000000004, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 264.74399, "t": 213.68201, "r": 285.73074, "b": 221.75171, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 221.75171, "r_x1": 285.73074, "r_y1": 221.75171, "r_x2": 285.73074, "r_y2": 213.68201, "r_x3": 264.74399, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 302.444, "t": 213.68201, "r": 323.43076, "b": 221.75171, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 221.75171, "r_x1": 323.43076, "r_y1": 221.75171, "r_x2": 323.43076, "r_y2": 213.68201, "r_x3": 302.444, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 337.815, "t": 213.61919999999998, "r": 361.97586, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 221.54552999999999, "r_x1": 361.97586, "r_y1": 221.54552999999999, "r_x2": 361.97586, "r_y2": 213.61919999999998, "r_x3": 337.815, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 380.46399, "t": 213.61919999999998, "r": 404.62485, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 221.54552999999999, "r_x1": 404.62485, "r_y1": 221.54552999999999, "r_x2": 404.62485, "r_y2": 213.61919999999998, "r_x3": 380.46399, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 435.49300999999997, "t": 213.61919999999998, "r": 454.35025, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 221.54552999999999, "r_x1": 454.35025, "r_y1": 221.54552999999999, "r_x2": 454.35025, "r_y2": 213.61919999999998, "r_x3": 435.49300999999997, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 220.903, "t": 226.63396999999998, "r": 248.66655999999998, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 234.70367, "r_x1": 248.66655999999998, "r_y1": 234.70367, "r_x2": 248.66655999999998, "r_y2": 226.63396999999998, "r_x3": 220.903, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 264.74399, "t": 226.63396999999998, "r": 285.73074, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 234.70367, "r_x1": 285.73074, "r_y1": 234.70367, "r_x2": 285.73074, "r_y2": 226.63396999999998, "r_x3": 264.74399, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 302.444, "t": 226.63396999999998, "r": 323.43076, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 234.70367, "r_x1": 323.43076, "r_y1": 234.70367, "r_x2": 323.43076, "r_y2": 226.63396999999998, "r_x3": 302.444, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 341.70599, "t": 226.63396999999998, "r": 358.08582, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.70599, "r_y0": 234.70367, "r_x1": 358.08582, "r_y1": 234.70367, "r_x2": 358.08582, "r_y2": 226.63396999999998, "r_x3": 341.70599, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 382.052, "t": 226.63396999999998, "r": 403.03876, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 234.70367, "r_x1": 403.03876, "r_y1": 234.70367, "r_x2": 403.03876, "r_y2": 226.63396999999998, "r_x3": 382.052, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 436.73199000000005, "t": 226.63396999999998, "r": 453.11182, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 234.70367, "r_x1": 453.11182, "r_y1": 234.70367, "r_x2": 453.11182, "r_y2": 226.63396999999998, "r_x3": 436.73199000000005, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 148.62601, "t": 245.46294999999998, "r": 207.1524, "b": 253.53265, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.62601, "r_y0": 253.53265, "r_x1": 207.1524, "r_y1": 253.53265, "r_x2": 207.1524, "r_y2": 245.46294999999998, "r_x3": 148.62601, "r_y3": 245.46294999999998, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 222.43700000000004, "t": 239.98297000000002, "r": 247.13226000000003, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 248.05267000000003, "r_x1": 247.13226000000003, "r_y1": 248.05267000000003, "r_x2": 247.13226000000003, "r_y2": 239.98297000000002, "r_x3": 222.43700000000004, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 264.74399, "t": 239.98297000000002, "r": 285.73074, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 248.05267000000003, "r_x1": 285.73074, "r_y1": 248.05267000000003, "r_x2": 285.73074, "r_y2": 239.98297000000002, "r_x3": 264.74399, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 302.444, "t": 239.98297000000002, "r": 323.43076, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 248.05267000000003, "r_x1": 323.43076, "r_y1": 248.05267000000003, "r_x2": 323.43076, "r_y2": 239.98297000000002, "r_x3": 302.444, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 337.815, "t": 239.92016999999998, "r": 361.97586, "b": 247.8465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 247.8465, "r_x1": 361.97586, "r_y1": 247.8465, "r_x2": 361.97586, "r_y2": 239.92016999999998, "r_x3": 337.815, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 380.46399, "t": 239.92016999999998, "r": 404.62485, "b": 247.8465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 247.8465, "r_x1": 404.62485, "r_y1": 247.8465, "r_x2": 404.62485, "r_y2": 239.92016999999998, "r_x3": 380.46399, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 435.49300999999997, "t": 239.92016999999998, "r": 454.35025, "b": 247.8465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 247.8465, "r_x1": 454.35025, "r_y1": 247.8465, "r_x2": 454.35025, "r_y2": 239.92016999999998, "r_x3": 435.49300999999997, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 220.903, "t": 252.93499999999995, "r": 248.66655999999998, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 261.00469999999996, "r_x1": 248.66655999999998, "r_y1": 261.00469999999996, "r_x2": 248.66655999999998, "r_y2": 252.93499999999995, "r_x3": 220.903, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 264.74399, "t": 252.93499999999995, "r": 285.73074, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 261.00469999999996, "r_x1": 285.73074, "r_y1": 261.00469999999996, "r_x2": 285.73074, "r_y2": 252.93499999999995, "r_x3": 264.74399, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 302.444, "t": 252.93499999999995, "r": 323.43076, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 261.00469999999996, "r_x1": 323.43076, "r_y1": 261.00469999999996, "r_x2": 323.43076, "r_y2": 252.93499999999995, "r_x3": 302.444, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 339.40302, "t": 252.93499999999995, "r": 360.38977, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 261.00469999999996, "r_x1": 360.38977, "r_y1": 261.00469999999996, "r_x2": 360.38977, "r_y2": 252.93499999999995, "r_x3": 339.40302, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 382.052, "t": 252.93499999999995, "r": 403.03876, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 261.00469999999996, "r_x1": 403.03876, "r_y1": 261.00469999999996, "r_x2": 403.03876, "r_y2": 252.93499999999995, "r_x3": 382.052, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 436.73199000000005, "t": 252.93499999999995, "r": 453.11182, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 261.00469999999996, "r_x1": 453.11182, "r_y1": 261.00469999999996, "r_x2": 453.11182, "r_y2": 252.93499999999995, "r_x3": 436.73199000000005, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 3, "label": "section_header", "bbox": { "l": 134.765, "t": 288.91479, "r": 257.08679, "b": 297.72173999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9546447992324829, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 297.72173999999995, "r_x1": 149.40205, "r_y1": 297.72173999999995, "r_x2": 149.40205, "r_y2": 288.91479, "r_x3": 134.765, "r_y3": 288.91479, "coord_origin": "TOPLEFT" }, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 297.72173999999995, "r_x1": 257.08679, "r_y1": 297.72173999999995, "r_x2": 257.08679, "r_y2": 288.91479, "r_x3": 160.85904, "r_y3": 288.91479, "coord_origin": "TOPLEFT" }, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 309.86078, "r": 480.58981, "b": 366.47769, "coord_origin": "TOPLEFT" }, "confidence": 0.9834085702896118, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 318.65775, "r_x1": 480.58777, "r_y1": 318.65775, "r_x2": 480.58777, "r_y2": 309.86078, "r_x3": 134.765, "r_y3": 309.86078, "coord_origin": "TOPLEFT" }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "orig": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 330.61273, "r_x1": 480.58889999999997, "r_y1": 330.61273, "r_x2": 480.58889999999997, "r_y2": 321.81577, "r_x3": 134.765, "r_y3": 321.81577, "coord_origin": "TOPLEFT" }, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 342.56772, "r_x1": 480.58681999999993, "r_y1": 342.56772, "r_x2": 480.58681999999993, "r_y2": 333.77075, "r_x3": 134.765, "r_y3": 333.77075, "coord_origin": "TOPLEFT" }, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 354.52271, "r_x1": 480.58981, "r_y1": 354.52271, "r_x2": 480.58981, "r_y2": 345.72574, "r_x3": 134.765, "r_y3": 345.72574, "coord_origin": "TOPLEFT" }, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 366.47769, "r_x1": 161.65704, "r_y1": 366.47769, "r_x2": 161.65704, "r_y2": 357.68073, "r_x3": 134.765, "r_y3": 357.68073, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "caption", "bbox": { "l": 134.765, "t": 397.59012, "r": 480.59106, "b": 439.71716, "coord_origin": "TOPLEFT" }, "confidence": 0.9482728838920593, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 405.51642, "r_x1": 162.64424, "r_y1": 405.51642, "r_x2": 162.64424, "r_y2": 397.59012, "r_x3": 134.765, "r_y3": 397.59012, "coord_origin": "TOPLEFT" }, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.384, "r_y0": 405.72266, "r_x1": 480.59106, "r_y1": 405.72266, "r_x2": 480.59106, "r_y2": 397.65289, "r_x3": 167.384, "r_y3": 397.65289, "coord_origin": "TOPLEFT" }, "text": "The OTSL model produces more accurate bounding boxes with less over-", "orig": "The OTSL model produces more accurate bounding boxes with less over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 416.68167000000005, "r_x1": 480.59106, "r_y1": 416.68167000000005, "r_x2": 480.59106, "r_y2": 408.61190999999997, "r_x3": 134.765, "r_y3": 408.61190999999997, "coord_origin": "TOPLEFT" }, "text": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 427.64066, "r_x1": 480.58838000000003, "r_y1": 427.64066, "r_x2": 480.58838000000003, "r_y2": 419.57089, "r_x3": 134.765, "r_y3": 419.57089, "coord_origin": "TOPLEFT" }, "text": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "orig": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 438.59964, "r_x1": 304.69171, "r_y1": 438.59964, "r_x2": 304.69171, "r_y2": 430.52987999999993, "r_x3": 134.765, "r_y3": 430.52987999999993, "coord_origin": "TOPLEFT" }, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 342.63354, "r_y0": 439.71716, "r_x1": 344.81915, "r_y1": 439.71716, "r_x2": 344.81915, "r_y2": 430.19678, "r_x3": 342.63354, "r_y3": 430.19678, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "picture", "bbox": { "l": 162.67430114746094, "t": 444.62255859375, "r": 451.70062255859375, "b": 663.2135620117188, "coord_origin": "TOPLEFT" }, "confidence": 0.9742383360862732, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 518.94992, "r_x1": 190.62042, "r_y1": 518.94992, "r_x2": 190.62042, "r_y2": 516.2332200000001, "r_x3": 180.12473, "r_y3": 516.2332200000001, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 522.84879, "r_x1": 304.54797, "r_y1": 522.84879, "r_x2": 304.54797, "r_y2": 520.13208, "r_x3": 183.2438, "r_y3": 520.13208, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 526.74765, "r_x1": 388.42313, "r_y1": 526.74765, "r_x2": 388.42313, "r_y2": 524.03094, "r_x3": 183.2438, "r_y3": 524.03094, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 530.64648, "r_x1": 388.42313, "r_y1": 530.64648, "r_x2": 388.42313, "r_y2": 527.9297799999999, "r_x3": 183.2438, "r_y3": 527.9297799999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 534.54532, "r_x1": 388.42313, "r_y1": 534.54532, "r_x2": 388.42313, "r_y2": 531.82861, "r_x3": 183.2438, "r_y3": 531.82861, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 538.44418, "r_x1": 388.42313, "r_y1": 538.44418, "r_x2": 388.42313, "r_y2": 535.72748, "r_x3": 183.2438, "r_y3": 535.72748, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 542.34303, "r_x1": 388.42313, "r_y1": 542.34303, "r_x2": 388.42313, "r_y2": 539.62631, "r_x3": 183.2438, "r_y3": 539.62631, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 546.24188, "r_x1": 388.42313, "r_y1": 546.24188, "r_x2": 388.42313, "r_y2": 543.52516, "r_x3": 183.2438, "r_y3": 543.52516, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 550.14073, "r_x1": 388.42313, "r_y1": 550.14073, "r_x2": 388.42313, "r_y2": 547.42401, "r_x3": 183.2438, "r_y3": 547.42401, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 554.03958, "r_x1": 388.42313, "r_y1": 554.03958, "r_x2": 388.42313, "r_y2": 551.32286, "r_x3": 183.2438, "r_y3": 551.32286, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 557.93845, "r_x1": 191.86806, "r_y1": 557.93845, "r_x2": 191.86806, "r_y2": 555.22173, "r_x3": 180.12473, "r_y3": 555.22173, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 521.01712, "r_x1": 408.82025, "r_y1": 521.01712, "r_x2": 408.82025, "r_y2": 518.30042, "r_x3": 407.38348, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 521.01712, "r_x1": 450.48605, "r_y1": 521.01712, "r_x2": 450.48605, "r_y2": 518.30042, "r_x3": 410.25699, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 524.9159500000001, "r_x1": 408.82025, "r_y1": 524.9159500000001, "r_x2": 408.82025, "r_y2": 522.19925, "r_x3": 407.38348, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 524.9159500000001, "r_x1": 450.48605, "r_y1": 524.9159500000001, "r_x2": 450.48605, "r_y2": 522.19925, "r_x3": 410.25699, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 528.81479, "r_x1": 408.82025, "r_y1": 528.81479, "r_x2": 408.82025, "r_y2": 526.09808, "r_x3": 407.38348, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 528.81479, "r_x1": 450.48605, "r_y1": 528.81479, "r_x2": 450.48605, "r_y2": 526.09808, "r_x3": 410.25699, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 532.7136499999999, "r_x1": 408.82025, "r_y1": 532.7136499999999, "r_x2": 408.82025, "r_y2": 529.99695, "r_x3": 407.38348, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 532.7136499999999, "r_x1": 450.48605, "r_y1": 532.7136499999999, "r_x2": 450.48605, "r_y2": 529.99695, "r_x3": 410.25699, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 536.6125, "r_x1": 408.82025, "r_y1": 536.6125, "r_x2": 408.82025, "r_y2": 533.8957800000001, "r_x3": 407.38348, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 536.6125, "r_x1": 450.48605, "r_y1": 536.6125, "r_x2": 450.48605, "r_y2": 533.8957800000001, "r_x3": 410.25699, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 540.51135, "r_x1": 408.82025, "r_y1": 540.51135, "r_x2": 408.82025, "r_y2": 537.79463, "r_x3": 407.38348, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 540.51135, "r_x1": 450.48605, "r_y1": 540.51135, "r_x2": 450.48605, "r_y2": 537.79463, "r_x3": 410.25699, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 544.4102, "r_x1": 408.82025, "r_y1": 544.4102, "r_x2": 408.82025, "r_y2": 541.69348, "r_x3": 407.38348, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 544.4102, "r_x1": 450.48605, "r_y1": 544.4102, "r_x2": 450.48605, "r_y2": 541.69348, "r_x3": 410.25699, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 548.3090500000001, "r_x1": 408.82025, "r_y1": 548.3090500000001, "r_x2": 408.82025, "r_y2": 545.59233, "r_x3": 407.38348, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 548.3090500000001, "r_x1": 450.48605, "r_y1": 548.3090500000001, "r_x2": 450.48605, "r_y2": 545.59233, "r_x3": 410.25699, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 552.2079200000001, "r_x1": 408.82025, "r_y1": 552.2079200000001, "r_x2": 408.82025, "r_y2": 549.4911999999999, "r_x3": 407.38348, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 552.2079200000001, "r_x1": 450.48605, "r_y1": 552.2079200000001, "r_x2": 450.48605, "r_y2": 549.4911999999999, "r_x3": 410.25699, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.52881, "r_y0": 515.31, "r_x1": 181.8528, "r_y1": 515.31, "r_x2": 181.8528, "r_y2": 509.45859, "r_x3": 164.52881, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58441, "r_y0": 515.31, "r_x1": 186.3974, "r_y1": 515.31, "r_x2": 186.3974, "r_y2": 509.45859, "r_x3": 183.58441, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2104, "r_y0": 515.31, "r_x1": 208.90137, "r_y1": 515.31, "r_x2": 208.90137, "r_y2": 509.45859, "r_x3": 189.2104, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63269, "r_y0": 515.31, "r_x1": 221.04044, "r_y1": 515.31, "r_x2": 221.04044, "r_y2": 509.45859, "r_x3": 210.63269, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.20203, "r_y0": 515.45502, "r_x1": 406.83609, "r_y1": 515.45502, "r_x2": 406.83609, "r_y2": 509.60361, "r_x3": 390.20203, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.56952, "r_y0": 515.45502, "r_x1": 411.38251, "r_y1": 515.45502, "r_x2": 411.38251, "r_y2": 509.60361, "r_x3": 408.56952, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.1955, "r_y0": 515.45502, "r_x1": 433.88647000000003, "r_y1": 515.45502, "r_x2": 433.88647000000003, "r_y2": 509.60361, "r_x3": 414.1955, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61737, "r_y0": 515.45502, "r_x1": 446.02512, "r_y1": 515.45502, "r_x2": 446.02512, "r_y2": 509.60361, "r_x3": 435.61737, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19316, "r_y0": 526.3866, "r_x1": 172.8231, "r_y1": 526.3866, "r_x2": 172.8231, "r_y2": 519.07236, "r_x3": 167.19316, "r_y3": 519.07236, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.33745, "r_y0": 455.93909, "r_x1": 192.96739, "r_y1": 455.93909, "r_x2": 192.96739, "r_y2": 448.62485, "r_x3": 187.33745, "r_y3": 448.62485, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.38654, "r_y0": 573.3194, "r_x1": 173.01648, "r_y1": 573.3194, "r_x2": 173.01648, "r_y2": 566.0051599999999, "r_x3": 167.38654, "r_y3": 566.0051599999999, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.45621000000003, "r_y0": 629.09431, "r_x1": 253.65727, "r_y1": 629.09431, "r_x2": 253.65727, "r_y2": 621.78008, "r_x3": 248.45621000000003, "r_y3": 621.78008, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.90057, "r_y0": 526.5137, "r_x1": 401.53052, "r_y1": 526.5137, "r_x2": 401.53052, "r_y2": 519.19946, "r_x3": 395.90057, "r_y3": 519.19946, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.62886, "r_y0": 597.26784, "r_x1": 177.48148, "r_y1": 597.26784, "r_x2": 177.48148, "r_y2": 580.28853, "r_x3": 171.62886, "r_y3": 580.28853, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.05969000000002, "r_y0": 649.92345, "r_x1": 256.91235, "r_y1": 649.92345, "r_x2": 256.91235, "r_y2": 633.63408, "r_x3": 251.05969000000002, "r_y3": 633.63408, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 607.30864, "r_x1": 427.0379, "r_y1": 607.30864, "r_x2": 427.0379, "r_y2": 601.45724, "r_x3": 372.14645, "r_y3": 601.45724, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 613.75087, "r_x1": 430.06838999999997, "r_y1": 613.75087, "r_x2": 430.06838999999997, "r_y2": 607.89948, "r_x3": 372.14645, "r_y3": 607.89948, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 648.72348, "r_x1": 231.08191, "r_y1": 648.72348, "r_x2": 231.08191, "r_y2": 642.87209, "r_x3": 176.88042, "r_y3": 642.87209, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 655.1657, "r_x1": 230.99271000000002, "r_y1": 655.1657, "r_x2": 230.99271000000002, "r_y2": 649.3143, "r_x3": 176.88042, "r_y3": 649.3143, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 661.60794, "r_x1": 203.93219, "r_y1": 661.60794, "r_x2": 203.93219, "r_y2": 655.7565500000001, "r_x3": 176.88042, "r_y3": 655.7565500000001, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93231000000003, "r_y0": 569.15967, "r_x1": 218.4697, "r_y1": 569.15967, "r_x2": 218.4697, "r_y2": 557.56342, "r_x3": 215.93231000000003, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.05689999999998, "r_y0": 569.15967, "r_x1": 231.71908999999997, "r_y1": 569.15967, "r_x2": 231.71908999999997, "r_y2": 557.56342, "r_x3": 229.05689999999998, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.20892, "r_y0": 451.19727, "r_x1": 263.56973, "r_y1": 451.19727, "r_x2": 263.56973, "r_y2": 448.46124, "r_x3": 261.20892, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33463, "r_y0": 451.19727, "r_x1": 313.6362, "r_y1": 451.19727, "r_x2": 313.6362, "r_y2": 448.46124, "r_x3": 312.33463, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41125, "r_y0": 451.19727, "r_x1": 380.05737, "r_y1": 451.19727, "r_x2": 380.05737, "r_y2": 448.46124, "r_x3": 377.41125, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63976, "r_y0": 456.07599, "r_x1": 205.82492, "r_y1": 456.07599, "r_x2": 205.82492, "r_y2": 453.33997, "r_x3": 200.63976, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.20833000000002, "r_y0": 456.07599, "r_x1": 229.76836, "r_y1": 456.07599, "r_x2": 229.76836, "r_y2": 453.33997, "r_x3": 222.20833000000002, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26666, "r_y0": 456.07599, "r_x1": 250.82669, "r_y1": 456.07599, "r_x2": 250.82669, "r_y2": 453.33997, "r_x3": 243.26666, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29657, "r_y0": 456.07599, "r_x1": 271.84949, "r_y1": 456.07599, "r_x2": 271.84949, "r_y2": 453.33997, "r_x3": 264.29657, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.31943, "r_y0": 456.07599, "r_x1": 292.87946, "r_y1": 456.07599, "r_x2": 292.87946, "r_y2": 453.33997, "r_x3": 285.31943, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37775, "r_y0": 456.07599, "r_x1": 311.77319, "r_y1": 456.07599, "r_x2": 311.77319, "r_y2": 453.33997, "r_x3": 306.37775, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.41699, "r_y0": 456.07599, "r_x1": 325.58157, "r_y1": 456.07599, "r_x2": 325.58157, "r_y2": 453.33997, "r_x3": 323.41699, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.45807, "r_y0": 456.07599, "r_x1": 336.62265, "r_y1": 456.07599, "r_x2": 336.62265, "r_y2": 453.33997, "r_x3": 334.45807, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52756, "r_y0": 456.07599, "r_x1": 347.69214, "r_y1": 456.07599, "r_x2": 347.69214, "r_y2": 453.33997, "r_x3": 345.52756, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56863, "r_y0": 456.07599, "r_x1": 358.73322, "r_y1": 456.07599, "r_x2": 358.73322, "r_y2": 453.33997, "r_x3": 356.56863, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63812, "r_y0": 456.07599, "r_x1": 371.97089, "r_y1": 456.07599, "r_x2": 371.97089, "r_y2": 453.33997, "r_x3": 367.63812, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.6734, "r_y0": 456.07599, "r_x1": 387.00616, "r_y1": 456.07599, "r_x2": 387.00616, "r_y2": 453.33997, "r_x3": 382.6734, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73727, "r_y0": 456.07599, "r_x1": 402.07001, "r_y1": 456.07599, "r_x2": 402.07001, "r_y2": 453.33997, "r_x3": 397.73727, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78879, "r_y0": 457.79964999999993, "r_x1": 414.93463, "r_y1": 457.79964999999993, "r_x2": 414.93463, "r_y2": 447.99298, "r_x3": 412.78879, "r_y3": 447.99298, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.95697, "r_y0": 456.07599, "r_x1": 422.51746, "r_y1": 456.07599, "r_x2": 422.51746, "r_y2": 453.33997, "r_x3": 414.95697, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63998, "r_y0": 466.66043, "r_x1": 204.57674, "r_y1": 466.66043, "r_x2": 204.57674, "r_y2": 463.92444, "r_x3": 200.63998, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62604, "r_y0": 466.66043, "r_x1": 369.58032, "r_y1": 466.66043, "r_x2": 369.58032, "r_y2": 463.92444, "r_x3": 367.62604, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 466.66043, "r_x1": 384.6156, "r_y1": 466.66043, "r_x2": 384.6156, "r_y2": 463.92444, "r_x3": 382.66132, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72504, "r_y0": 466.66043, "r_x1": 399.67932, "r_y1": 466.66043, "r_x2": 399.67932, "r_y2": 463.92444, "r_x3": 397.72504, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.53915, "r_x1": 206.51694, "r_y1": 471.53915, "r_x2": 206.51694, "r_y2": 468.80313, "r_x3": 200.64, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 471.53915, "r_x1": 266.25885, "r_y1": 471.53915, "r_x2": 266.25885, "r_y2": 468.80313, "r_x3": 264.29047, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37213, "r_y0": 471.53915, "r_x1": 308.34052, "r_y1": 471.53915, "r_x2": 308.34052, "r_y2": 468.80313, "r_x3": 306.37213, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.51526, "r_y0": 471.53915, "r_x1": 347.48364, "r_y1": 471.53915, "r_x2": 347.48364, "r_y2": 468.80313, "r_x3": 345.51526, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.55634, "r_y0": 471.53915, "r_x1": 358.52472, "r_y1": 471.53915, "r_x2": 358.52472, "r_y2": 468.80313, "r_x3": 356.55634, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62582, "r_y0": 471.53915, "r_x1": 369.59418, "r_y1": 471.53915, "r_x2": 369.59418, "r_y2": 468.80313, "r_x3": 367.62582, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66107, "r_y0": 471.53915, "r_x1": 384.62946, "r_y1": 471.53915, "r_x2": 384.62946, "r_y2": 468.80313, "r_x3": 382.66107, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.41788, "r_x1": 206.51694, "r_y1": 476.41788, "r_x2": 206.51694, "r_y2": 473.68185, "r_x3": 200.64, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 476.41788, "r_x1": 266.25885, "r_y1": 476.41788, "r_x2": 266.25885, "r_y2": 473.68185, "r_x3": 264.29047, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.26816, "r_x1": 206.51694, "r_y1": 481.26816, "r_x2": 206.51694, "r_y2": 478.53214, "r_x3": 200.64, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26373, "r_y0": 481.26816, "r_x1": 245.2321, "r_y1": 481.26816, "r_x2": 245.2321, "r_y2": 478.53214, "r_x3": 243.26373, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 481.26816, "r_x1": 266.25885, "r_y1": 481.26816, "r_x2": 266.25885, "r_y2": 478.53214, "r_x3": 264.29047, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.40466, "r_y0": 481.26816, "r_x1": 325.37305, "r_y1": 481.26816, "r_x2": 325.37305, "r_y2": 478.53214, "r_x3": 323.40466, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72519, "r_y0": 481.26816, "r_x1": 399.69354, "r_y1": 481.26816, "r_x2": 399.69354, "r_y2": 478.53214, "r_x3": 397.72519, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.14688, "r_x1": 206.51694, "r_y1": 486.14688, "r_x2": 206.51694, "r_y2": 483.41086, "r_x3": 200.64, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 486.14688, "r_x1": 384.61563, "r_y1": 486.14688, "r_x2": 384.61563, "r_y2": 483.41086, "r_x3": 382.66132, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72513, "r_y0": 486.14688, "r_x1": 401.64819, "r_y1": 486.14688, "r_x2": 401.64819, "r_y2": 483.41086, "r_x3": 397.72513, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78928, "r_y0": 486.14688, "r_x1": 414.74359, "r_y1": 486.14688, "r_x2": 414.74359, "r_y2": 483.41086, "r_x3": 412.78928, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64014, "r_y0": 491.0256, "r_x1": 207.14445, "r_y1": 491.0256, "r_x2": 207.14445, "r_y2": 488.28958, "r_x3": 200.64014, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62616, "r_y0": 491.0256, "r_x1": 369.78375, "r_y1": 491.0256, "r_x2": 369.78375, "r_y2": 488.28958, "r_x3": 367.62616, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66141, "r_y0": 491.0256, "r_x1": 384.81897, "r_y1": 491.0256, "r_x2": 384.81897, "r_y2": 488.28958, "r_x3": 382.66141, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7251, "r_y0": 491.0256, "r_x1": 402.05087, "r_y1": 491.0256, "r_x2": 402.05087, "r_y2": 488.28958, "r_x3": 397.7251, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64032, "r_y0": 495.90433, "r_x1": 208.48566, "r_y1": 495.90433, "r_x2": 208.48566, "r_y2": 493.1683, "r_x3": 200.64032, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29044, "r_y0": 495.90433, "r_x1": 266.25879, "r_y1": 495.90433, "r_x2": 266.25879, "r_y2": 493.1683, "r_x3": 264.29044, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 58, "label": "text", "bbox": { "l": 180.12473, "t": 516.2332200000001, "r": 190.62042, "b": 518.94992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 518.94992, "r_x1": 190.62042, "r_y1": 518.94992, "r_x2": 190.62042, "r_y2": 516.2332200000001, "r_x3": 180.12473, "r_y3": 516.2332200000001, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 183.2438, "t": 520.13208, "r": 304.54797, "b": 522.84879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 522.84879, "r_x1": 304.54797, "r_y1": 522.84879, "r_x2": 304.54797, "r_y2": 520.13208, "r_x3": 183.2438, "r_y3": 520.13208, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.2438, "t": 524.03094, "r": 388.42313, "b": 526.74765, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 526.74765, "r_x1": 388.42313, "r_y1": 526.74765, "r_x2": 388.42313, "r_y2": 524.03094, "r_x3": 183.2438, "r_y3": 524.03094, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 183.2438, "t": 527.9297799999999, "r": 388.42313, "b": 530.64648, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 530.64648, "r_x1": 388.42313, "r_y1": 530.64648, "r_x2": 388.42313, "r_y2": 527.9297799999999, "r_x3": 183.2438, "r_y3": 527.9297799999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 183.2438, "t": 531.82861, "r": 388.42313, "b": 534.54532, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 534.54532, "r_x1": 388.42313, "r_y1": 534.54532, "r_x2": 388.42313, "r_y2": 531.82861, "r_x3": 183.2438, "r_y3": 531.82861, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 183.2438, "t": 535.72748, "r": 388.42313, "b": 538.44418, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 538.44418, "r_x1": 388.42313, "r_y1": 538.44418, "r_x2": 388.42313, "r_y2": 535.72748, "r_x3": 183.2438, "r_y3": 535.72748, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 183.2438, "t": 539.62631, "r": 388.42313, "b": 542.34303, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 542.34303, "r_x1": 388.42313, "r_y1": 542.34303, "r_x2": 388.42313, "r_y2": 539.62631, "r_x3": 183.2438, "r_y3": 539.62631, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 183.2438, "t": 543.52516, "r": 388.42313, "b": 546.24188, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 546.24188, "r_x1": 388.42313, "r_y1": 546.24188, "r_x2": 388.42313, "r_y2": 543.52516, "r_x3": 183.2438, "r_y3": 543.52516, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 183.2438, "t": 547.42401, "r": 388.42313, "b": 550.14073, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 550.14073, "r_x1": 388.42313, "r_y1": 550.14073, "r_x2": 388.42313, "r_y2": 547.42401, "r_x3": 183.2438, "r_y3": 547.42401, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.2438, "t": 551.32286, "r": 388.42313, "b": 554.03958, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 554.03958, "r_x1": 388.42313, "r_y1": 554.03958, "r_x2": 388.42313, "r_y2": 551.32286, "r_x3": 183.2438, "r_y3": 551.32286, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 180.12473, "t": 555.22173, "r": 191.86806, "b": 557.93845, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 557.93845, "r_x1": 191.86806, "r_y1": 557.93845, "r_x2": 191.86806, "r_y2": 555.22173, "r_x3": 180.12473, "r_y3": 555.22173, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 407.38348, "t": 518.30042, "r": 408.82025, "b": 521.01712, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 521.01712, "r_x1": 408.82025, "r_y1": 521.01712, "r_x2": 408.82025, "r_y2": 518.30042, "r_x3": 407.38348, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 410.25699, "t": 518.30042, "r": 450.48605, "b": 521.01712, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 521.01712, "r_x1": 450.48605, "r_y1": 521.01712, "r_x2": 450.48605, "r_y2": 518.30042, "r_x3": 410.25699, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 407.38348, "t": 522.19925, "r": 408.82025, "b": 524.9159500000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 524.9159500000001, "r_x1": 408.82025, "r_y1": 524.9159500000001, "r_x2": 408.82025, "r_y2": 522.19925, "r_x3": 407.38348, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 410.25699, "t": 522.19925, "r": 450.48605, "b": 524.9159500000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 524.9159500000001, "r_x1": 450.48605, "r_y1": 524.9159500000001, "r_x2": 450.48605, "r_y2": 522.19925, "r_x3": 410.25699, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 407.38348, "t": 526.09808, "r": 408.82025, "b": 528.81479, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 528.81479, "r_x1": 408.82025, "r_y1": 528.81479, "r_x2": 408.82025, "r_y2": 526.09808, "r_x3": 407.38348, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 410.25699, "t": 526.09808, "r": 450.48605, "b": 528.81479, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 528.81479, "r_x1": 450.48605, "r_y1": 528.81479, "r_x2": 450.48605, "r_y2": 526.09808, "r_x3": 410.25699, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 407.38348, "t": 529.99695, "r": 408.82025, "b": 532.7136499999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 532.7136499999999, "r_x1": 408.82025, "r_y1": 532.7136499999999, "r_x2": 408.82025, "r_y2": 529.99695, "r_x3": 407.38348, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 410.25699, "t": 529.99695, "r": 450.48605, "b": 532.7136499999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 532.7136499999999, "r_x1": 450.48605, "r_y1": 532.7136499999999, "r_x2": 450.48605, "r_y2": 529.99695, "r_x3": 410.25699, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 407.38348, "t": 533.8957800000001, "r": 408.82025, "b": 536.6125, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 536.6125, "r_x1": 408.82025, "r_y1": 536.6125, "r_x2": 408.82025, "r_y2": 533.8957800000001, "r_x3": 407.38348, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 410.25699, "t": 533.8957800000001, "r": 450.48605, "b": 536.6125, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 536.6125, "r_x1": 450.48605, "r_y1": 536.6125, "r_x2": 450.48605, "r_y2": 533.8957800000001, "r_x3": 410.25699, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 407.38348, "t": 537.79463, "r": 408.82025, "b": 540.51135, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 540.51135, "r_x1": 408.82025, "r_y1": 540.51135, "r_x2": 408.82025, "r_y2": 537.79463, "r_x3": 407.38348, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 410.25699, "t": 537.79463, "r": 450.48605, "b": 540.51135, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 540.51135, "r_x1": 450.48605, "r_y1": 540.51135, "r_x2": 450.48605, "r_y2": 537.79463, "r_x3": 410.25699, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 407.38348, "t": 541.69348, "r": 408.82025, "b": 544.4102, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 544.4102, "r_x1": 408.82025, "r_y1": 544.4102, "r_x2": 408.82025, "r_y2": 541.69348, "r_x3": 407.38348, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 410.25699, "t": 541.69348, "r": 450.48605, "b": 544.4102, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 544.4102, "r_x1": 450.48605, "r_y1": 544.4102, "r_x2": 450.48605, "r_y2": 541.69348, "r_x3": 410.25699, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 407.38348, "t": 545.59233, "r": 408.82025, "b": 548.3090500000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 548.3090500000001, "r_x1": 408.82025, "r_y1": 548.3090500000001, "r_x2": 408.82025, "r_y2": 545.59233, "r_x3": 407.38348, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 410.25699, "t": 545.59233, "r": 450.48605, "b": 548.3090500000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 548.3090500000001, "r_x1": 450.48605, "r_y1": 548.3090500000001, "r_x2": 450.48605, "r_y2": 545.59233, "r_x3": 410.25699, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 407.38348, "t": 549.4911999999999, "r": 408.82025, "b": 552.2079200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 552.2079200000001, "r_x1": 408.82025, "r_y1": 552.2079200000001, "r_x2": 408.82025, "r_y2": 549.4911999999999, "r_x3": 407.38348, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 410.25699, "t": 549.4911999999999, "r": 450.48605, "b": 552.2079200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 552.2079200000001, "r_x1": 450.48605, "r_y1": 552.2079200000001, "r_x2": 450.48605, "r_y2": 549.4911999999999, "r_x3": 410.25699, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 164.52881, "t": 509.45859, "r": 181.8528, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.52881, "r_y0": 515.31, "r_x1": 181.8528, "r_y1": 515.31, "r_x2": 181.8528, "r_y2": 509.45859, "r_x3": 164.52881, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.58441, "t": 509.45859, "r": 186.3974, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58441, "r_y0": 515.31, "r_x1": 186.3974, "r_y1": 515.31, "r_x2": 186.3974, "r_y2": 509.45859, "r_x3": 183.58441, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 189.2104, "t": 509.45859, "r": 208.90137, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2104, "r_y0": 515.31, "r_x1": 208.90137, "r_y1": 515.31, "r_x2": 208.90137, "r_y2": 509.45859, "r_x3": 189.2104, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 210.63269, "t": 509.45859, "r": 221.04044, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63269, "r_y0": 515.31, "r_x1": 221.04044, "r_y1": 515.31, "r_x2": 221.04044, "r_y2": 509.45859, "r_x3": 210.63269, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 390.20203, "t": 509.60361, "r": 406.83609, "b": 515.45502, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.20203, "r_y0": 515.45502, "r_x1": 406.83609, "r_y1": 515.45502, "r_x2": 406.83609, "r_y2": 509.60361, "r_x3": 390.20203, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 408.56952, "t": 509.60361, "r": 411.38251, "b": 515.45502, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.56952, "r_y0": 515.45502, "r_x1": 411.38251, "r_y1": 515.45502, "r_x2": 411.38251, "r_y2": 509.60361, "r_x3": 408.56952, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 414.1955, "t": 509.60361, "r": 433.88647000000003, "b": 515.45502, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.1955, "r_y0": 515.45502, "r_x1": 433.88647000000003, "r_y1": 515.45502, "r_x2": 433.88647000000003, "r_y2": 509.60361, "r_x3": 414.1955, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 435.61737, "t": 509.60361, "r": 446.02512, "b": 515.45502, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61737, "r_y0": 515.45502, "r_x1": 446.02512, "r_y1": 515.45502, "r_x2": 446.02512, "r_y2": 509.60361, "r_x3": 435.61737, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 167.19316, "t": 519.07236, "r": 172.8231, "b": 526.3866, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19316, "r_y0": 526.3866, "r_x1": 172.8231, "r_y1": 526.3866, "r_x2": 172.8231, "r_y2": 519.07236, "r_x3": 167.19316, "r_y3": 519.07236, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 187.33745, "t": 448.62485, "r": 192.96739, "b": 455.93909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.33745, "r_y0": 455.93909, "r_x1": 192.96739, "r_y1": 455.93909, "r_x2": 192.96739, "r_y2": 448.62485, "r_x3": 187.33745, "r_y3": 448.62485, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 167.38654, "t": 566.0051599999999, "r": 173.01648, "b": 573.3194, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.38654, "r_y0": 573.3194, "r_x1": 173.01648, "r_y1": 573.3194, "r_x2": 173.01648, "r_y2": 566.0051599999999, "r_x3": 167.38654, "r_y3": 566.0051599999999, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 248.45621000000003, "t": 621.78008, "r": 253.65727, "b": 629.09431, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.45621000000003, "r_y0": 629.09431, "r_x1": 253.65727, "r_y1": 629.09431, "r_x2": 253.65727, "r_y2": 621.78008, "r_x3": 248.45621000000003, "r_y3": 621.78008, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 395.90057, "t": 519.19946, "r": 401.53052, "b": 526.5137, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.90057, "r_y0": 526.5137, "r_x1": 401.53052, "r_y1": 526.5137, "r_x2": 401.53052, "r_y2": 519.19946, "r_x3": 395.90057, "r_y3": 519.19946, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 171.62886, "t": 580.28853, "r": 177.48148, "b": 597.26784, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.62886, "r_y0": 597.26784, "r_x1": 177.48148, "r_y1": 597.26784, "r_x2": 177.48148, "r_y2": 580.28853, "r_x3": 171.62886, "r_y3": 580.28853, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 251.05969000000002, "t": 633.63408, "r": 256.91235, "b": 649.92345, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.05969000000002, "r_y0": 649.92345, "r_x1": 256.91235, "r_y1": 649.92345, "r_x2": 256.91235, "r_y2": 633.63408, "r_x3": 251.05969000000002, "r_y3": 633.63408, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 372.14645, "t": 601.45724, "r": 427.0379, "b": 607.30864, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 607.30864, "r_x1": 427.0379, "r_y1": 607.30864, "r_x2": 427.0379, "r_y2": 601.45724, "r_x3": 372.14645, "r_y3": 601.45724, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 372.14645, "t": 607.89948, "r": 430.06838999999997, "b": 613.75087, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 613.75087, "r_x1": 430.06838999999997, "r_y1": 613.75087, "r_x2": 430.06838999999997, "r_y2": 607.89948, "r_x3": 372.14645, "r_y3": 607.89948, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 176.88042, "t": 642.87209, "r": 231.08191, "b": 648.72348, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 648.72348, "r_x1": 231.08191, "r_y1": 648.72348, "r_x2": 231.08191, "r_y2": 642.87209, "r_x3": 176.88042, "r_y3": 642.87209, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 176.88042, "t": 649.3143, "r": 230.99271000000002, "b": 655.1657, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 655.1657, "r_x1": 230.99271000000002, "r_y1": 655.1657, "r_x2": 230.99271000000002, "r_y2": 649.3143, "r_x3": 176.88042, "r_y3": 649.3143, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 176.88042, "t": 655.7565500000001, "r": 203.93219, "b": 661.60794, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 661.60794, "r_x1": 203.93219, "r_y1": 661.60794, "r_x2": 203.93219, "r_y2": 655.7565500000001, "r_x3": 176.88042, "r_y3": 655.7565500000001, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 215.93231000000003, "t": 557.56342, "r": 218.4697, "b": 569.15967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93231000000003, "r_y0": 569.15967, "r_x1": 218.4697, "r_y1": 569.15967, "r_x2": 218.4697, "r_y2": 557.56342, "r_x3": 215.93231000000003, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 229.05689999999998, "t": 557.56342, "r": 231.71908999999997, "b": 569.15967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.05689999999998, "r_y0": 569.15967, "r_x1": 231.71908999999997, "r_y1": 569.15967, "r_x2": 231.71908999999997, "r_y2": 557.56342, "r_x3": 229.05689999999998, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 261.20892, "t": 448.46124, "r": 263.56973, "b": 451.19727, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.20892, "r_y0": 451.19727, "r_x1": 263.56973, "r_y1": 451.19727, "r_x2": 263.56973, "r_y2": 448.46124, "r_x3": 261.20892, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 312.33463, "t": 448.46124, "r": 313.6362, "b": 451.19727, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33463, "r_y0": 451.19727, "r_x1": 313.6362, "r_y1": 451.19727, "r_x2": 313.6362, "r_y2": 448.46124, "r_x3": 312.33463, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 377.41125, "t": 448.46124, "r": 380.05737, "b": 451.19727, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41125, "r_y0": 451.19727, "r_x1": 380.05737, "r_y1": 451.19727, "r_x2": 380.05737, "r_y2": 448.46124, "r_x3": 377.41125, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 200.63976, "t": 453.33997, "r": 205.82492, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63976, "r_y0": 456.07599, "r_x1": 205.82492, "r_y1": 456.07599, "r_x2": 205.82492, "r_y2": 453.33997, "r_x3": 200.63976, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 222.20833000000002, "t": 453.33997, "r": 229.76836, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.20833000000002, "r_y0": 456.07599, "r_x1": 229.76836, "r_y1": 456.07599, "r_x2": 229.76836, "r_y2": 453.33997, "r_x3": 222.20833000000002, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 243.26666, "t": 453.33997, "r": 250.82669, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26666, "r_y0": 456.07599, "r_x1": 250.82669, "r_y1": 456.07599, "r_x2": 250.82669, "r_y2": 453.33997, "r_x3": 243.26666, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 264.29657, "t": 453.33997, "r": 271.84949, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29657, "r_y0": 456.07599, "r_x1": 271.84949, "r_y1": 456.07599, "r_x2": 271.84949, "r_y2": 453.33997, "r_x3": 264.29657, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 285.31943, "t": 453.33997, "r": 292.87946, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.31943, "r_y0": 456.07599, "r_x1": 292.87946, "r_y1": 456.07599, "r_x2": 292.87946, "r_y2": 453.33997, "r_x3": 285.31943, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 306.37775, "t": 453.33997, "r": 311.77319, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37775, "r_y0": 456.07599, "r_x1": 311.77319, "r_y1": 456.07599, "r_x2": 311.77319, "r_y2": 453.33997, "r_x3": 306.37775, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 323.41699, "t": 453.33997, "r": 325.58157, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.41699, "r_y0": 456.07599, "r_x1": 325.58157, "r_y1": 456.07599, "r_x2": 325.58157, "r_y2": 453.33997, "r_x3": 323.41699, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 334.45807, "t": 453.33997, "r": 336.62265, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.45807, "r_y0": 456.07599, "r_x1": 336.62265, "r_y1": 456.07599, "r_x2": 336.62265, "r_y2": 453.33997, "r_x3": 334.45807, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 345.52756, "t": 453.33997, "r": 347.69214, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52756, "r_y0": 456.07599, "r_x1": 347.69214, "r_y1": 456.07599, "r_x2": 347.69214, "r_y2": 453.33997, "r_x3": 345.52756, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 356.56863, "t": 453.33997, "r": 358.73322, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56863, "r_y0": 456.07599, "r_x1": 358.73322, "r_y1": 456.07599, "r_x2": 358.73322, "r_y2": 453.33997, "r_x3": 356.56863, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 367.63812, "t": 453.33997, "r": 371.97089, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63812, "r_y0": 456.07599, "r_x1": 371.97089, "r_y1": 456.07599, "r_x2": 371.97089, "r_y2": 453.33997, "r_x3": 367.63812, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 382.6734, "t": 453.33997, "r": 387.00616, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.6734, "r_y0": 456.07599, "r_x1": 387.00616, "r_y1": 456.07599, "r_x2": 387.00616, "r_y2": 453.33997, "r_x3": 382.6734, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 397.73727, "t": 453.33997, "r": 402.07001, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73727, "r_y0": 456.07599, "r_x1": 402.07001, "r_y1": 456.07599, "r_x2": 402.07001, "r_y2": 453.33997, "r_x3": 397.73727, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 412.78879, "t": 447.99298, "r": 414.93463, "b": 457.79964999999993, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78879, "r_y0": 457.79964999999993, "r_x1": 414.93463, "r_y1": 457.79964999999993, "r_x2": 414.93463, "r_y2": 447.99298, "r_x3": 412.78879, "r_y3": 447.99298, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 414.95697, "t": 453.33997, "r": 422.51746, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.95697, "r_y0": 456.07599, "r_x1": 422.51746, "r_y1": 456.07599, "r_x2": 422.51746, "r_y2": 453.33997, "r_x3": 414.95697, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 200.63998, "t": 463.92444, "r": 204.57674, "b": 466.66043, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63998, "r_y0": 466.66043, "r_x1": 204.57674, "r_y1": 466.66043, "r_x2": 204.57674, "r_y2": 463.92444, "r_x3": 200.63998, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 367.62604, "t": 463.92444, "r": 369.58032, "b": 466.66043, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62604, "r_y0": 466.66043, "r_x1": 369.58032, "r_y1": 466.66043, "r_x2": 369.58032, "r_y2": 463.92444, "r_x3": 367.62604, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 382.66132, "t": 463.92444, "r": 384.6156, "b": 466.66043, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 466.66043, "r_x1": 384.6156, "r_y1": 466.66043, "r_x2": 384.6156, "r_y2": 463.92444, "r_x3": 382.66132, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 397.72504, "t": 463.92444, "r": 399.67932, "b": 466.66043, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72504, "r_y0": 466.66043, "r_x1": 399.67932, "r_y1": 466.66043, "r_x2": 399.67932, "r_y2": 463.92444, "r_x3": 397.72504, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 200.64, "t": 468.80313, "r": 206.51694, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.53915, "r_x1": 206.51694, "r_y1": 471.53915, "r_x2": 206.51694, "r_y2": 468.80313, "r_x3": 200.64, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 264.29047, "t": 468.80313, "r": 266.25885, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 471.53915, "r_x1": 266.25885, "r_y1": 471.53915, "r_x2": 266.25885, "r_y2": 468.80313, "r_x3": 264.29047, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 306.37213, "t": 468.80313, "r": 308.34052, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37213, "r_y0": 471.53915, "r_x1": 308.34052, "r_y1": 471.53915, "r_x2": 308.34052, "r_y2": 468.80313, "r_x3": 306.37213, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 345.51526, "t": 468.80313, "r": 347.48364, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.51526, "r_y0": 471.53915, "r_x1": 347.48364, "r_y1": 471.53915, "r_x2": 347.48364, "r_y2": 468.80313, "r_x3": 345.51526, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 356.55634, "t": 468.80313, "r": 358.52472, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.55634, "r_y0": 471.53915, "r_x1": 358.52472, "r_y1": 471.53915, "r_x2": 358.52472, "r_y2": 468.80313, "r_x3": 356.55634, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 367.62582, "t": 468.80313, "r": 369.59418, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62582, "r_y0": 471.53915, "r_x1": 369.59418, "r_y1": 471.53915, "r_x2": 369.59418, "r_y2": 468.80313, "r_x3": 367.62582, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 382.66107, "t": 468.80313, "r": 384.62946, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66107, "r_y0": 471.53915, "r_x1": 384.62946, "r_y1": 471.53915, "r_x2": 384.62946, "r_y2": 468.80313, "r_x3": 382.66107, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 200.64, "t": 473.68185, "r": 206.51694, "b": 476.41788, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.41788, "r_x1": 206.51694, "r_y1": 476.41788, "r_x2": 206.51694, "r_y2": 473.68185, "r_x3": 200.64, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 264.29047, "t": 473.68185, "r": 266.25885, "b": 476.41788, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 476.41788, "r_x1": 266.25885, "r_y1": 476.41788, "r_x2": 266.25885, "r_y2": 473.68185, "r_x3": 264.29047, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 200.64, "t": 478.53214, "r": 206.51694, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.26816, "r_x1": 206.51694, "r_y1": 481.26816, "r_x2": 206.51694, "r_y2": 478.53214, "r_x3": 200.64, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 243.26373, "t": 478.53214, "r": 245.2321, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26373, "r_y0": 481.26816, "r_x1": 245.2321, "r_y1": 481.26816, "r_x2": 245.2321, "r_y2": 478.53214, "r_x3": 243.26373, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 264.29047, "t": 478.53214, "r": 266.25885, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 481.26816, "r_x1": 266.25885, "r_y1": 481.26816, "r_x2": 266.25885, "r_y2": 478.53214, "r_x3": 264.29047, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 323.40466, "t": 478.53214, "r": 325.37305, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.40466, "r_y0": 481.26816, "r_x1": 325.37305, "r_y1": 481.26816, "r_x2": 325.37305, "r_y2": 478.53214, "r_x3": 323.40466, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 397.72519, "t": 478.53214, "r": 399.69354, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72519, "r_y0": 481.26816, "r_x1": 399.69354, "r_y1": 481.26816, "r_x2": 399.69354, "r_y2": 478.53214, "r_x3": 397.72519, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 200.64, "t": 483.41086, "r": 206.51694, "b": 486.14688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.14688, "r_x1": 206.51694, "r_y1": 486.14688, "r_x2": 206.51694, "r_y2": 483.41086, "r_x3": 200.64, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 382.66132, "t": 483.41086, "r": 384.61563, "b": 486.14688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 486.14688, "r_x1": 384.61563, "r_y1": 486.14688, "r_x2": 384.61563, "r_y2": 483.41086, "r_x3": 382.66132, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 397.72513, "t": 483.41086, "r": 401.64819, "b": 486.14688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72513, "r_y0": 486.14688, "r_x1": 401.64819, "r_y1": 486.14688, "r_x2": 401.64819, "r_y2": 483.41086, "r_x3": 397.72513, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 412.78928, "t": 483.41086, "r": 414.74359, "b": 486.14688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78928, "r_y0": 486.14688, "r_x1": 414.74359, "r_y1": 486.14688, "r_x2": 414.74359, "r_y2": 483.41086, "r_x3": 412.78928, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 200.64014, "t": 488.28958, "r": 207.14445, "b": 491.0256, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64014, "r_y0": 491.0256, "r_x1": 207.14445, "r_y1": 491.0256, "r_x2": 207.14445, "r_y2": 488.28958, "r_x3": 200.64014, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 367.62616, "t": 488.28958, "r": 369.78375, "b": 491.0256, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62616, "r_y0": 491.0256, "r_x1": 369.78375, "r_y1": 491.0256, "r_x2": 369.78375, "r_y2": 488.28958, "r_x3": 367.62616, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 382.66141, "t": 488.28958, "r": 384.81897, "b": 491.0256, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66141, "r_y0": 491.0256, "r_x1": 384.81897, "r_y1": 491.0256, "r_x2": 384.81897, "r_y2": 488.28958, "r_x3": 382.66141, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 397.7251, "t": 488.28958, "r": 402.05087, "b": 491.0256, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7251, "r_y0": 491.0256, "r_x1": 402.05087, "r_y1": 491.0256, "r_x2": 402.05087, "r_y2": 488.28958, "r_x3": 397.7251, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 200.64032, "t": 493.1683, "r": 208.48566, "b": 495.90433, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64032, "r_y0": 495.90433, "r_x1": 208.48566, "r_y1": 495.90433, "r_x2": 208.48566, "r_y2": 493.1683, "r_x3": 200.64032, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 264.29044, "t": 493.1683, "r": 266.25879, "b": 495.90433, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29044, "r_y0": 495.90433, "r_x1": 266.25879, "r_y1": 495.90433, "r_x2": 266.25879, "r_y2": 493.1683, "r_x3": 264.29044, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 155, "label": "text", "bbox": { "l": 227.91466, "t": 665.82603, "r": 230.10028, "b": 675.3464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.91466, "r_y0": 675.3464, "r_x1": 230.10028, "r_y1": 675.3464, "r_x2": 230.10028, "r_y2": 665.82603, "r_x3": 227.91466, "r_y3": 665.82603, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 156, "label": "text", "bbox": { "l": 300.58057, "t": 683.62195, "r": 302.72638, "b": 693.428658, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.58057, "r_y0": 693.428658, "r_x1": 302.72638, "r_y1": 693.428658, "r_x2": 302.72638, "r_y2": 683.62195, "r_x3": 300.58057, "r_y3": 683.62195, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": { "0": { "label": "table", "id": 0, "page_no": 9, "cluster": { "id": 0, "label": "table", "bbox": { "l": 143.6376495361328, "t": 156.3477020263672, "r": 470.8485412597656, "b": 263.2624816894531, "coord_origin": "TOPLEFT" }, "confidence": 0.9884640574455261, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.782, "r_y0": 174.62865999999997, "r_x1": 194.99779, "r_y1": 174.62865999999997, "r_x2": 194.99779, "r_y2": 166.55895999999996, "r_x3": 160.782, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52499000000003, "r_y0": 174.6037, "r_x1": 254.04465, "r_y1": 174.6037, "r_x2": 254.04465, "r_y2": 166.534, "r_x3": 215.52499000000003, "r_y3": 166.534, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.397, "r_y0": 169.14868, "r_x1": 323.99118, "r_y1": 169.14868, "r_x2": 323.99118, "r_y2": 161.07898, "r_x3": 300.397, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.345, "r_y0": 174.62865999999997, "r_x1": 414.74661, "r_y1": 174.62865999999997, "r_x2": 414.74661, "r_y2": 166.55895999999996, "r_x3": 370.345, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.737, "r_y0": 169.14868, "r_x1": 463.10830999999996, "r_y1": 169.14868, "r_x2": 463.10830999999996, "r_y2": 161.07898, "r_x3": 426.737, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11401, "r_y0": 180.10766999999998, "r_x1": 466.72656, "r_y1": 180.10766999999998, "r_x2": 466.72656, "r_y2": 172.03796, "r_x3": 423.11401, "r_y3": 172.03796, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41299, "r_y0": 182.10071000000005, "r_x1": 288.0596, "r_y1": 182.10071000000005, "r_x2": 288.0596, "r_y2": 174.03101000000004, "r_x3": 262.41299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.42899, "r_y0": 182.10071000000005, "r_x1": 329.44687, "r_y1": 182.10071000000005, "r_x2": 329.44687, "r_y2": 174.03101000000004, "r_x3": 296.42899, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03299, "r_y0": 182.10071000000005, "r_x1": 354.75793, "r_y1": 182.10071000000005, "r_x2": 354.75793, "r_y2": 174.03101000000004, "r_x3": 345.03299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.53799, "r_y0": 200.92969000000005, "r_x1": 201.24129, "r_y1": 200.92969000000005, "r_x2": 201.24129, "r_y2": 192.85999000000004, "r_x3": 154.53799, "r_y3": 192.85999000000004, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 195.45068000000003, "r_x1": 247.13226000000003, "r_y1": 195.45068000000003, "r_x2": 247.13226000000003, "r_y2": 187.38098000000002, "r_x3": 222.43700000000004, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 195.45068000000003, "r_x1": 285.73074, "r_y1": 195.45068000000003, "r_x2": 285.73074, "r_y2": 187.38098000000002, "r_x3": 264.74399, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 195.45068000000003, "r_x1": 323.43076, "r_y1": 195.45068000000003, "r_x2": 323.43076, "r_y2": 187.38098000000002, "r_x3": 302.444, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 195.45068000000003, "r_x1": 360.38977, "r_y1": 195.45068000000003, "r_x2": 360.38977, "r_y2": 187.38098000000002, "r_x3": 339.40302, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.116, "r_y0": 195.24451, "r_x1": 401.97324, "r_y1": 195.24451, "r_x2": 401.97324, "r_y2": 187.31817999999998, "r_x3": 383.116, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 195.24451, "r_x1": 454.35025, "r_y1": 195.24451, "r_x2": 454.35025, "r_y2": 187.31817999999998, "r_x3": 435.49300999999997, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 208.40166999999997, "r_x1": 248.66655999999998, "r_y1": 208.40166999999997, "r_x2": 248.66655999999998, "r_y2": 200.33196999999996, "r_x3": 220.903, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 208.40166999999997, "r_x1": 285.73074, "r_y1": 208.40166999999997, "r_x2": 285.73074, "r_y2": 200.33196999999996, "r_x3": 264.74399, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 208.40166999999997, "r_x1": 323.43076, "r_y1": 208.40166999999997, "r_x2": 323.43076, "r_y2": 200.33196999999996, "r_x3": 302.444, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 208.40166999999997, "r_x1": 360.38977, "r_y1": 208.40166999999997, "r_x2": 360.38977, "r_y2": 200.33196999999996, "r_x3": 339.40302, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 208.40166999999997, "r_x1": 403.03876, "r_y1": 208.40166999999997, "r_x2": 403.03876, "r_y2": 200.33196999999996, "r_x3": 382.052, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 208.40166999999997, "r_x1": 453.11182, "r_y1": 208.40166999999997, "r_x2": 453.11182, "r_y2": 200.33196999999996, "r_x3": 436.73199000000005, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.94501, "r_y0": 227.23168999999996, "r_x1": 199.83374, "r_y1": 227.23168999999996, "r_x2": 199.83374, "r_y2": 219.16198999999995, "r_x3": 155.94501, "r_y3": 219.16198999999995, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 221.75171, "r_x1": 247.13226000000003, "r_y1": 221.75171, "r_x2": 247.13226000000003, "r_y2": 213.68201, "r_x3": 222.43700000000004, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 221.75171, "r_x1": 285.73074, "r_y1": 221.75171, "r_x2": 285.73074, "r_y2": 213.68201, "r_x3": 264.74399, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 221.75171, "r_x1": 323.43076, "r_y1": 221.75171, "r_x2": 323.43076, "r_y2": 213.68201, "r_x3": 302.444, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 221.54552999999999, "r_x1": 361.97586, "r_y1": 221.54552999999999, "r_x2": 361.97586, "r_y2": 213.61919999999998, "r_x3": 337.815, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 221.54552999999999, "r_x1": 404.62485, "r_y1": 221.54552999999999, "r_x2": 404.62485, "r_y2": 213.61919999999998, "r_x3": 380.46399, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 221.54552999999999, "r_x1": 454.35025, "r_y1": 221.54552999999999, "r_x2": 454.35025, "r_y2": 213.61919999999998, "r_x3": 435.49300999999997, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 234.70367, "r_x1": 248.66655999999998, "r_y1": 234.70367, "r_x2": 248.66655999999998, "r_y2": 226.63396999999998, "r_x3": 220.903, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 234.70367, "r_x1": 285.73074, "r_y1": 234.70367, "r_x2": 285.73074, "r_y2": 226.63396999999998, "r_x3": 264.74399, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 234.70367, "r_x1": 323.43076, "r_y1": 234.70367, "r_x2": 323.43076, "r_y2": 226.63396999999998, "r_x3": 302.444, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.70599, "r_y0": 234.70367, "r_x1": 358.08582, "r_y1": 234.70367, "r_x2": 358.08582, "r_y2": 226.63396999999998, "r_x3": 341.70599, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 234.70367, "r_x1": 403.03876, "r_y1": 234.70367, "r_x2": 403.03876, "r_y2": 226.63396999999998, "r_x3": 382.052, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 234.70367, "r_x1": 453.11182, "r_y1": 234.70367, "r_x2": 453.11182, "r_y2": 226.63396999999998, "r_x3": 436.73199000000005, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.62601, "r_y0": 253.53265, "r_x1": 207.1524, "r_y1": 253.53265, "r_x2": 207.1524, "r_y2": 245.46294999999998, "r_x3": 148.62601, "r_y3": 245.46294999999998, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 248.05267000000003, "r_x1": 247.13226000000003, "r_y1": 248.05267000000003, "r_x2": 247.13226000000003, "r_y2": 239.98297000000002, "r_x3": 222.43700000000004, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 248.05267000000003, "r_x1": 285.73074, "r_y1": 248.05267000000003, "r_x2": 285.73074, "r_y2": 239.98297000000002, "r_x3": 264.74399, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 248.05267000000003, "r_x1": 323.43076, "r_y1": 248.05267000000003, "r_x2": 323.43076, "r_y2": 239.98297000000002, "r_x3": 302.444, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 247.8465, "r_x1": 361.97586, "r_y1": 247.8465, "r_x2": 361.97586, "r_y2": 239.92016999999998, "r_x3": 337.815, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 247.8465, "r_x1": 404.62485, "r_y1": 247.8465, "r_x2": 404.62485, "r_y2": 239.92016999999998, "r_x3": 380.46399, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 247.8465, "r_x1": 454.35025, "r_y1": 247.8465, "r_x2": 454.35025, "r_y2": 239.92016999999998, "r_x3": 435.49300999999997, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 261.00469999999996, "r_x1": 248.66655999999998, "r_y1": 261.00469999999996, "r_x2": 248.66655999999998, "r_y2": 252.93499999999995, "r_x3": 220.903, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 261.00469999999996, "r_x1": 285.73074, "r_y1": 261.00469999999996, "r_x2": 285.73074, "r_y2": 252.93499999999995, "r_x3": 264.74399, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 261.00469999999996, "r_x1": 323.43076, "r_y1": 261.00469999999996, "r_x2": 323.43076, "r_y2": 252.93499999999995, "r_x3": 302.444, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 261.00469999999996, "r_x1": 360.38977, "r_y1": 261.00469999999996, "r_x2": 360.38977, "r_y2": 252.93499999999995, "r_x3": 339.40302, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 261.00469999999996, "r_x1": 403.03876, "r_y1": 261.00469999999996, "r_x2": 403.03876, "r_y2": 252.93499999999995, "r_x3": 382.052, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 261.00469999999996, "r_x1": 453.11182, "r_y1": 261.00469999999996, "r_x2": 453.11182, "r_y2": 252.93499999999995, "r_x3": 436.73199000000005, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 10, "label": "text", "bbox": { "l": 160.782, "t": 166.55895999999996, "r": 194.99779, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.782, "r_y0": 174.62865999999997, "r_x1": 194.99779, "r_y1": 174.62865999999997, "r_x2": 194.99779, "r_y2": 166.55895999999996, "r_x3": 160.782, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 215.52499000000003, "t": 166.534, "r": 254.04465, "b": 174.6037, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52499000000003, "r_y0": 174.6037, "r_x1": 254.04465, "r_y1": 174.6037, "r_x2": 254.04465, "r_y2": 166.534, "r_x3": 215.52499000000003, "r_y3": 166.534, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 300.397, "t": 161.07898, "r": 323.99118, "b": 169.14868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.397, "r_y0": 169.14868, "r_x1": 323.99118, "r_y1": 169.14868, "r_x2": 323.99118, "r_y2": 161.07898, "r_x3": 300.397, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 370.345, "t": 166.55895999999996, "r": 414.74661, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.345, "r_y0": 174.62865999999997, "r_x1": 414.74661, "r_y1": 174.62865999999997, "r_x2": 414.74661, "r_y2": 166.55895999999996, "r_x3": 370.345, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 426.737, "t": 161.07898, "r": 463.10830999999996, "b": 169.14868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.737, "r_y0": 169.14868, "r_x1": 463.10830999999996, "r_y1": 169.14868, "r_x2": 463.10830999999996, "r_y2": 161.07898, "r_x3": 426.737, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 423.11401, "t": 172.03796, "r": 466.72656, "b": 180.10766999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11401, "r_y0": 180.10766999999998, "r_x1": 466.72656, "r_y1": 180.10766999999998, "r_x2": 466.72656, "r_y2": 172.03796, "r_x3": 423.11401, "r_y3": 172.03796, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 262.41299, "t": 174.03101000000004, "r": 288.0596, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41299, "r_y0": 182.10071000000005, "r_x1": 288.0596, "r_y1": 182.10071000000005, "r_x2": 288.0596, "r_y2": 174.03101000000004, "r_x3": 262.41299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 296.42899, "t": 174.03101000000004, "r": 329.44687, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.42899, "r_y0": 182.10071000000005, "r_x1": 329.44687, "r_y1": 182.10071000000005, "r_x2": 329.44687, "r_y2": 174.03101000000004, "r_x3": 296.42899, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 345.03299, "t": 174.03101000000004, "r": 354.75793, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03299, "r_y0": 182.10071000000005, "r_x1": 354.75793, "r_y1": 182.10071000000005, "r_x2": 354.75793, "r_y2": 174.03101000000004, "r_x3": 345.03299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 154.53799, "t": 192.85999000000004, "r": 201.24129, "b": 200.92969000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.53799, "r_y0": 200.92969000000005, "r_x1": 201.24129, "r_y1": 200.92969000000005, "r_x2": 201.24129, "r_y2": 192.85999000000004, "r_x3": 154.53799, "r_y3": 192.85999000000004, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 222.43700000000004, "t": 187.38098000000002, "r": 247.13226000000003, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 195.45068000000003, "r_x1": 247.13226000000003, "r_y1": 195.45068000000003, "r_x2": 247.13226000000003, "r_y2": 187.38098000000002, "r_x3": 222.43700000000004, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 264.74399, "t": 187.38098000000002, "r": 285.73074, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 195.45068000000003, "r_x1": 285.73074, "r_y1": 195.45068000000003, "r_x2": 285.73074, "r_y2": 187.38098000000002, "r_x3": 264.74399, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 302.444, "t": 187.38098000000002, "r": 323.43076, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 195.45068000000003, "r_x1": 323.43076, "r_y1": 195.45068000000003, "r_x2": 323.43076, "r_y2": 187.38098000000002, "r_x3": 302.444, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 339.40302, "t": 187.38098000000002, "r": 360.38977, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 195.45068000000003, "r_x1": 360.38977, "r_y1": 195.45068000000003, "r_x2": 360.38977, "r_y2": 187.38098000000002, "r_x3": 339.40302, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 383.116, "t": 187.31817999999998, "r": 401.97324, "b": 195.24451, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.116, "r_y0": 195.24451, "r_x1": 401.97324, "r_y1": 195.24451, "r_x2": 401.97324, "r_y2": 187.31817999999998, "r_x3": 383.116, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 435.49300999999997, "t": 187.31817999999998, "r": 454.35025, "b": 195.24451, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 195.24451, "r_x1": 454.35025, "r_y1": 195.24451, "r_x2": 454.35025, "r_y2": 187.31817999999998, "r_x3": 435.49300999999997, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 220.903, "t": 200.33196999999996, "r": 248.66655999999998, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 208.40166999999997, "r_x1": 248.66655999999998, "r_y1": 208.40166999999997, "r_x2": 248.66655999999998, "r_y2": 200.33196999999996, "r_x3": 220.903, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 264.74399, "t": 200.33196999999996, "r": 285.73074, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 208.40166999999997, "r_x1": 285.73074, "r_y1": 208.40166999999997, "r_x2": 285.73074, "r_y2": 200.33196999999996, "r_x3": 264.74399, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 302.444, "t": 200.33196999999996, "r": 323.43076, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 208.40166999999997, "r_x1": 323.43076, "r_y1": 208.40166999999997, "r_x2": 323.43076, "r_y2": 200.33196999999996, "r_x3": 302.444, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 339.40302, "t": 200.33196999999996, "r": 360.38977, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 208.40166999999997, "r_x1": 360.38977, "r_y1": 208.40166999999997, "r_x2": 360.38977, "r_y2": 200.33196999999996, "r_x3": 339.40302, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 382.052, "t": 200.33196999999996, "r": 403.03876, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 208.40166999999997, "r_x1": 403.03876, "r_y1": 208.40166999999997, "r_x2": 403.03876, "r_y2": 200.33196999999996, "r_x3": 382.052, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 436.73199000000005, "t": 200.33196999999996, "r": 453.11182, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 208.40166999999997, "r_x1": 453.11182, "r_y1": 208.40166999999997, "r_x2": 453.11182, "r_y2": 200.33196999999996, "r_x3": 436.73199000000005, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 155.94501, "t": 219.16198999999995, "r": 199.83374, "b": 227.23168999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.94501, "r_y0": 227.23168999999996, "r_x1": 199.83374, "r_y1": 227.23168999999996, "r_x2": 199.83374, "r_y2": 219.16198999999995, "r_x3": 155.94501, "r_y3": 219.16198999999995, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 222.43700000000004, "t": 213.68201, "r": 247.13226000000003, "b": 221.75171, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 221.75171, "r_x1": 247.13226000000003, "r_y1": 221.75171, "r_x2": 247.13226000000003, "r_y2": 213.68201, "r_x3": 222.43700000000004, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 264.74399, "t": 213.68201, "r": 285.73074, "b": 221.75171, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 221.75171, "r_x1": 285.73074, "r_y1": 221.75171, "r_x2": 285.73074, "r_y2": 213.68201, "r_x3": 264.74399, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 302.444, "t": 213.68201, "r": 323.43076, "b": 221.75171, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 221.75171, "r_x1": 323.43076, "r_y1": 221.75171, "r_x2": 323.43076, "r_y2": 213.68201, "r_x3": 302.444, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 337.815, "t": 213.61919999999998, "r": 361.97586, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 221.54552999999999, "r_x1": 361.97586, "r_y1": 221.54552999999999, "r_x2": 361.97586, "r_y2": 213.61919999999998, "r_x3": 337.815, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 380.46399, "t": 213.61919999999998, "r": 404.62485, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 221.54552999999999, "r_x1": 404.62485, "r_y1": 221.54552999999999, "r_x2": 404.62485, "r_y2": 213.61919999999998, "r_x3": 380.46399, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 435.49300999999997, "t": 213.61919999999998, "r": 454.35025, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 221.54552999999999, "r_x1": 454.35025, "r_y1": 221.54552999999999, "r_x2": 454.35025, "r_y2": 213.61919999999998, "r_x3": 435.49300999999997, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 220.903, "t": 226.63396999999998, "r": 248.66655999999998, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 234.70367, "r_x1": 248.66655999999998, "r_y1": 234.70367, "r_x2": 248.66655999999998, "r_y2": 226.63396999999998, "r_x3": 220.903, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 264.74399, "t": 226.63396999999998, "r": 285.73074, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 234.70367, "r_x1": 285.73074, "r_y1": 234.70367, "r_x2": 285.73074, "r_y2": 226.63396999999998, "r_x3": 264.74399, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 302.444, "t": 226.63396999999998, "r": 323.43076, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 234.70367, "r_x1": 323.43076, "r_y1": 234.70367, "r_x2": 323.43076, "r_y2": 226.63396999999998, "r_x3": 302.444, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 341.70599, "t": 226.63396999999998, "r": 358.08582, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.70599, "r_y0": 234.70367, "r_x1": 358.08582, "r_y1": 234.70367, "r_x2": 358.08582, "r_y2": 226.63396999999998, "r_x3": 341.70599, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 382.052, "t": 226.63396999999998, "r": 403.03876, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 234.70367, "r_x1": 403.03876, "r_y1": 234.70367, "r_x2": 403.03876, "r_y2": 226.63396999999998, "r_x3": 382.052, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 436.73199000000005, "t": 226.63396999999998, "r": 453.11182, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 234.70367, "r_x1": 453.11182, "r_y1": 234.70367, "r_x2": 453.11182, "r_y2": 226.63396999999998, "r_x3": 436.73199000000005, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 148.62601, "t": 245.46294999999998, "r": 207.1524, "b": 253.53265, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.62601, "r_y0": 253.53265, "r_x1": 207.1524, "r_y1": 253.53265, "r_x2": 207.1524, "r_y2": 245.46294999999998, "r_x3": 148.62601, "r_y3": 245.46294999999998, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 222.43700000000004, "t": 239.98297000000002, "r": 247.13226000000003, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 248.05267000000003, "r_x1": 247.13226000000003, "r_y1": 248.05267000000003, "r_x2": 247.13226000000003, "r_y2": 239.98297000000002, "r_x3": 222.43700000000004, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 264.74399, "t": 239.98297000000002, "r": 285.73074, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 248.05267000000003, "r_x1": 285.73074, "r_y1": 248.05267000000003, "r_x2": 285.73074, "r_y2": 239.98297000000002, "r_x3": 264.74399, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 302.444, "t": 239.98297000000002, "r": 323.43076, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 248.05267000000003, "r_x1": 323.43076, "r_y1": 248.05267000000003, "r_x2": 323.43076, "r_y2": 239.98297000000002, "r_x3": 302.444, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 337.815, "t": 239.92016999999998, "r": 361.97586, "b": 247.8465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 247.8465, "r_x1": 361.97586, "r_y1": 247.8465, "r_x2": 361.97586, "r_y2": 239.92016999999998, "r_x3": 337.815, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 380.46399, "t": 239.92016999999998, "r": 404.62485, "b": 247.8465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 247.8465, "r_x1": 404.62485, "r_y1": 247.8465, "r_x2": 404.62485, "r_y2": 239.92016999999998, "r_x3": 380.46399, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 435.49300999999997, "t": 239.92016999999998, "r": 454.35025, "b": 247.8465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 247.8465, "r_x1": 454.35025, "r_y1": 247.8465, "r_x2": 454.35025, "r_y2": 239.92016999999998, "r_x3": 435.49300999999997, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 220.903, "t": 252.93499999999995, "r": 248.66655999999998, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 261.00469999999996, "r_x1": 248.66655999999998, "r_y1": 261.00469999999996, "r_x2": 248.66655999999998, "r_y2": 252.93499999999995, "r_x3": 220.903, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 264.74399, "t": 252.93499999999995, "r": 285.73074, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 261.00469999999996, "r_x1": 285.73074, "r_y1": 261.00469999999996, "r_x2": 285.73074, "r_y2": 252.93499999999995, "r_x3": 264.74399, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 302.444, "t": 252.93499999999995, "r": 323.43076, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 261.00469999999996, "r_x1": 323.43076, "r_y1": 261.00469999999996, "r_x2": 323.43076, "r_y2": 252.93499999999995, "r_x3": 302.444, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 339.40302, "t": 252.93499999999995, "r": 360.38977, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 261.00469999999996, "r_x1": 360.38977, "r_y1": 261.00469999999996, "r_x2": 360.38977, "r_y2": 252.93499999999995, "r_x3": 339.40302, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 382.052, "t": 252.93499999999995, "r": 403.03876, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 261.00469999999996, "r_x1": 403.03876, "r_y1": 261.00469999999996, "r_x2": 403.03876, "r_y2": 252.93499999999995, "r_x3": 382.052, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 436.73199000000005, "t": 252.93499999999995, "r": 453.11182, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 261.00469999999996, "r_x1": 453.11182, "r_y1": 261.00469999999996, "r_x2": 453.11182, "r_y2": 252.93499999999995, "r_x3": 436.73199000000005, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ched", "ched", "ched", "ucel", "ucel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 7, "table_cells": [ { "bbox": { "l": 160.782, "t": 166.55895999999996, "r": 194.99779, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Data set", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 215.52499000000003, "t": 166.534, "r": 254.04465, "b": 174.6037, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 300.397, "t": 161.07898, "r": 323.99118, "b": 169.14868, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 5, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 370.345, "t": 166.55895999999996, "r": 414.74661, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "mAP(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 426.737, "t": 161.07898, "r": 463.10830999999996, "b": 169.14868, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "Inference time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 262.41299, "t": 174.03101000000004, "r": 288.0596, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 296.42899, "t": 174.03101000000004, "r": 329.44687, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 345.03299, "t": 174.03101000000004, "r": 354.75793, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 154.53799, "t": 192.85999000000004, "r": 201.24129, "b": 200.92969000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.43700000000004, "t": 187.38098000000002, "r": 247.13226000000003, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74399, "t": 187.38098000000002, "r": 285.73074, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.444, "t": 187.38098000000002, "r": 323.43076, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 339.40302, "t": 187.38098000000002, "r": 360.38977, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 383.116, "t": 187.31817999999998, "r": 401.97324, "b": 195.24451, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49300999999997, "t": 187.31817999999998, "r": 454.35025, "b": 195.24451, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 155.94501, "t": 219.16198999999995, "r": 199.83374, "b": 227.23168999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.43700000000004, "t": 213.68201, "r": 247.13226000000003, "b": 221.75171, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74399, "t": 213.68201, "r": 285.73074, "b": 221.75171, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.955 0.917", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.444, "t": 213.68201, "r": 323.43076, "b": 221.75171, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.961 0.922", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.815, "t": 213.61919999999998, "r": 361.97586, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.959 0.92", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.46399, "t": 213.61919999999998, "r": 404.62485, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.862 0.722", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49300999999997, "t": 213.61919999999998, "r": 454.35025, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.85 3.26", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 148.62601, "t": 245.46294999999998, "r": 207.1524, "b": 253.53265, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTables-1M", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.43700000000004, "t": 239.98297000000002, "r": 247.13226000000003, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74399, "t": 239.98297000000002, "r": 285.73074, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.987 0.983", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.444, "t": 239.98297000000002, "r": 323.43076, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.964 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.815, "t": 239.92016999999998, "r": 361.97586, "b": 247.8465, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.977 0.966", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.46399, "t": 239.92016999999998, "r": 404.62485, "b": 247.8465, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.896 0.889", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49300999999997, "t": 239.92016999999998, "r": 454.35025, "b": 247.8465, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.79 3.26", "column_header": false, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 7, "page_no": 9, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 143.97887, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8309906721115112, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 143.97887, "r_y1": 101.84069999999997, "r_x2": 143.97887, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10" }, { "label": "page_header", "id": 6, "page_no": 9, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 167.82053, "t": 93.77099999999996, "r": 231.72049000000004, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8367075324058533, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82053, "r_y0": 101.84069999999997, "r_x1": 178.08249, "r_y1": 101.84069999999997, "r_x2": 178.08249, "r_y2": 93.77099999999996, "r_x3": 167.82053, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37929, "r_y0": 101.84069999999997, "r_x1": 231.72049000000004, "r_y1": 101.84069999999997, "r_x2": 231.72049000000004, "r_y2": 93.77099999999996, "r_x3": 182.37929, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "caption", "id": 4, "page_no": 9, "cluster": { "id": 4, "label": "caption", "bbox": { "l": 134.765, "t": 115.83618000000001, "r": 480.59357000000006, "b": 145.88666, "coord_origin": "TOPLEFT" }, "confidence": 0.9512290954589844, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 123.76251000000002, "r_x1": 173.09366, "r_y1": 123.76251000000002, "r_x2": 173.09366, "r_y2": 115.83618000000001, "r_x3": 134.765, "r_y3": 115.83618000000001, "coord_origin": "TOPLEFT" }, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.30299, "r_y0": 123.96868999999992, "r_x1": 480.59151999999995, "r_y1": 123.96868999999992, "r_x2": 480.59151999999995, "r_y2": 115.89899000000003, "r_x3": 181.30299, "r_y3": 115.89899000000003, "coord_origin": "TOPLEFT" }, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 134.92767000000003, "r_x1": 480.59357000000006, "r_y1": 134.92767000000003, "r_x2": 480.59357000000006, "r_y2": 126.85797000000014, "r_x3": 134.765, "r_y3": 126.85797000000014, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 145.88666, "r_x1": 305.95691, "r_y1": 145.88666, "r_x2": 305.95691, "r_y2": 137.81696, "r_x3": 134.765, "r_y3": 137.81696, "coord_origin": "TOPLEFT" }, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 2. TSR and cell detection results compared between OTSL and HTML on the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using TableFormer [9] (with enc=6, dec=6, heads=8)." }, { "label": "table", "id": 0, "page_no": 9, "cluster": { "id": 0, "label": "table", "bbox": { "l": 143.6376495361328, "t": 156.3477020263672, "r": 470.8485412597656, "b": 263.2624816894531, "coord_origin": "TOPLEFT" }, "confidence": 0.9884640574455261, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.782, "r_y0": 174.62865999999997, "r_x1": 194.99779, "r_y1": 174.62865999999997, "r_x2": 194.99779, "r_y2": 166.55895999999996, "r_x3": 160.782, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52499000000003, "r_y0": 174.6037, "r_x1": 254.04465, "r_y1": 174.6037, "r_x2": 254.04465, "r_y2": 166.534, "r_x3": 215.52499000000003, "r_y3": 166.534, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.397, "r_y0": 169.14868, "r_x1": 323.99118, "r_y1": 169.14868, "r_x2": 323.99118, "r_y2": 161.07898, "r_x3": 300.397, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.345, "r_y0": 174.62865999999997, "r_x1": 414.74661, "r_y1": 174.62865999999997, "r_x2": 414.74661, "r_y2": 166.55895999999996, "r_x3": 370.345, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.737, "r_y0": 169.14868, "r_x1": 463.10830999999996, "r_y1": 169.14868, "r_x2": 463.10830999999996, "r_y2": 161.07898, "r_x3": 426.737, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11401, "r_y0": 180.10766999999998, "r_x1": 466.72656, "r_y1": 180.10766999999998, "r_x2": 466.72656, "r_y2": 172.03796, "r_x3": 423.11401, "r_y3": 172.03796, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41299, "r_y0": 182.10071000000005, "r_x1": 288.0596, "r_y1": 182.10071000000005, "r_x2": 288.0596, "r_y2": 174.03101000000004, "r_x3": 262.41299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.42899, "r_y0": 182.10071000000005, "r_x1": 329.44687, "r_y1": 182.10071000000005, "r_x2": 329.44687, "r_y2": 174.03101000000004, "r_x3": 296.42899, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03299, "r_y0": 182.10071000000005, "r_x1": 354.75793, "r_y1": 182.10071000000005, "r_x2": 354.75793, "r_y2": 174.03101000000004, "r_x3": 345.03299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.53799, "r_y0": 200.92969000000005, "r_x1": 201.24129, "r_y1": 200.92969000000005, "r_x2": 201.24129, "r_y2": 192.85999000000004, "r_x3": 154.53799, "r_y3": 192.85999000000004, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 195.45068000000003, "r_x1": 247.13226000000003, "r_y1": 195.45068000000003, "r_x2": 247.13226000000003, "r_y2": 187.38098000000002, "r_x3": 222.43700000000004, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 195.45068000000003, "r_x1": 285.73074, "r_y1": 195.45068000000003, "r_x2": 285.73074, "r_y2": 187.38098000000002, "r_x3": 264.74399, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 195.45068000000003, "r_x1": 323.43076, "r_y1": 195.45068000000003, "r_x2": 323.43076, "r_y2": 187.38098000000002, "r_x3": 302.444, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 195.45068000000003, "r_x1": 360.38977, "r_y1": 195.45068000000003, "r_x2": 360.38977, "r_y2": 187.38098000000002, "r_x3": 339.40302, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.116, "r_y0": 195.24451, "r_x1": 401.97324, "r_y1": 195.24451, "r_x2": 401.97324, "r_y2": 187.31817999999998, "r_x3": 383.116, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 195.24451, "r_x1": 454.35025, "r_y1": 195.24451, "r_x2": 454.35025, "r_y2": 187.31817999999998, "r_x3": 435.49300999999997, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 208.40166999999997, "r_x1": 248.66655999999998, "r_y1": 208.40166999999997, "r_x2": 248.66655999999998, "r_y2": 200.33196999999996, "r_x3": 220.903, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 208.40166999999997, "r_x1": 285.73074, "r_y1": 208.40166999999997, "r_x2": 285.73074, "r_y2": 200.33196999999996, "r_x3": 264.74399, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 208.40166999999997, "r_x1": 323.43076, "r_y1": 208.40166999999997, "r_x2": 323.43076, "r_y2": 200.33196999999996, "r_x3": 302.444, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 208.40166999999997, "r_x1": 360.38977, "r_y1": 208.40166999999997, "r_x2": 360.38977, "r_y2": 200.33196999999996, "r_x3": 339.40302, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 208.40166999999997, "r_x1": 403.03876, "r_y1": 208.40166999999997, "r_x2": 403.03876, "r_y2": 200.33196999999996, "r_x3": 382.052, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 208.40166999999997, "r_x1": 453.11182, "r_y1": 208.40166999999997, "r_x2": 453.11182, "r_y2": 200.33196999999996, "r_x3": 436.73199000000005, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.94501, "r_y0": 227.23168999999996, "r_x1": 199.83374, "r_y1": 227.23168999999996, "r_x2": 199.83374, "r_y2": 219.16198999999995, "r_x3": 155.94501, "r_y3": 219.16198999999995, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 221.75171, "r_x1": 247.13226000000003, "r_y1": 221.75171, "r_x2": 247.13226000000003, "r_y2": 213.68201, "r_x3": 222.43700000000004, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 221.75171, "r_x1": 285.73074, "r_y1": 221.75171, "r_x2": 285.73074, "r_y2": 213.68201, "r_x3": 264.74399, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 221.75171, "r_x1": 323.43076, "r_y1": 221.75171, "r_x2": 323.43076, "r_y2": 213.68201, "r_x3": 302.444, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 221.54552999999999, "r_x1": 361.97586, "r_y1": 221.54552999999999, "r_x2": 361.97586, "r_y2": 213.61919999999998, "r_x3": 337.815, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 221.54552999999999, "r_x1": 404.62485, "r_y1": 221.54552999999999, "r_x2": 404.62485, "r_y2": 213.61919999999998, "r_x3": 380.46399, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 221.54552999999999, "r_x1": 454.35025, "r_y1": 221.54552999999999, "r_x2": 454.35025, "r_y2": 213.61919999999998, "r_x3": 435.49300999999997, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 234.70367, "r_x1": 248.66655999999998, "r_y1": 234.70367, "r_x2": 248.66655999999998, "r_y2": 226.63396999999998, "r_x3": 220.903, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 234.70367, "r_x1": 285.73074, "r_y1": 234.70367, "r_x2": 285.73074, "r_y2": 226.63396999999998, "r_x3": 264.74399, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 234.70367, "r_x1": 323.43076, "r_y1": 234.70367, "r_x2": 323.43076, "r_y2": 226.63396999999998, "r_x3": 302.444, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.70599, "r_y0": 234.70367, "r_x1": 358.08582, "r_y1": 234.70367, "r_x2": 358.08582, "r_y2": 226.63396999999998, "r_x3": 341.70599, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 234.70367, "r_x1": 403.03876, "r_y1": 234.70367, "r_x2": 403.03876, "r_y2": 226.63396999999998, "r_x3": 382.052, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 234.70367, "r_x1": 453.11182, "r_y1": 234.70367, "r_x2": 453.11182, "r_y2": 226.63396999999998, "r_x3": 436.73199000000005, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.62601, "r_y0": 253.53265, "r_x1": 207.1524, "r_y1": 253.53265, "r_x2": 207.1524, "r_y2": 245.46294999999998, "r_x3": 148.62601, "r_y3": 245.46294999999998, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 248.05267000000003, "r_x1": 247.13226000000003, "r_y1": 248.05267000000003, "r_x2": 247.13226000000003, "r_y2": 239.98297000000002, "r_x3": 222.43700000000004, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 248.05267000000003, "r_x1": 285.73074, "r_y1": 248.05267000000003, "r_x2": 285.73074, "r_y2": 239.98297000000002, "r_x3": 264.74399, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 248.05267000000003, "r_x1": 323.43076, "r_y1": 248.05267000000003, "r_x2": 323.43076, "r_y2": 239.98297000000002, "r_x3": 302.444, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 247.8465, "r_x1": 361.97586, "r_y1": 247.8465, "r_x2": 361.97586, "r_y2": 239.92016999999998, "r_x3": 337.815, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 247.8465, "r_x1": 404.62485, "r_y1": 247.8465, "r_x2": 404.62485, "r_y2": 239.92016999999998, "r_x3": 380.46399, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 247.8465, "r_x1": 454.35025, "r_y1": 247.8465, "r_x2": 454.35025, "r_y2": 239.92016999999998, "r_x3": 435.49300999999997, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 261.00469999999996, "r_x1": 248.66655999999998, "r_y1": 261.00469999999996, "r_x2": 248.66655999999998, "r_y2": 252.93499999999995, "r_x3": 220.903, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 261.00469999999996, "r_x1": 285.73074, "r_y1": 261.00469999999996, "r_x2": 285.73074, "r_y2": 252.93499999999995, "r_x3": 264.74399, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 261.00469999999996, "r_x1": 323.43076, "r_y1": 261.00469999999996, "r_x2": 323.43076, "r_y2": 252.93499999999995, "r_x3": 302.444, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 261.00469999999996, "r_x1": 360.38977, "r_y1": 261.00469999999996, "r_x2": 360.38977, "r_y2": 252.93499999999995, "r_x3": 339.40302, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 261.00469999999996, "r_x1": 403.03876, "r_y1": 261.00469999999996, "r_x2": 403.03876, "r_y2": 252.93499999999995, "r_x3": 382.052, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 261.00469999999996, "r_x1": 453.11182, "r_y1": 261.00469999999996, "r_x2": 453.11182, "r_y2": 252.93499999999995, "r_x3": 436.73199000000005, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 10, "label": "text", "bbox": { "l": 160.782, "t": 166.55895999999996, "r": 194.99779, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.782, "r_y0": 174.62865999999997, "r_x1": 194.99779, "r_y1": 174.62865999999997, "r_x2": 194.99779, "r_y2": 166.55895999999996, "r_x3": 160.782, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 215.52499000000003, "t": 166.534, "r": 254.04465, "b": 174.6037, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52499000000003, "r_y0": 174.6037, "r_x1": 254.04465, "r_y1": 174.6037, "r_x2": 254.04465, "r_y2": 166.534, "r_x3": 215.52499000000003, "r_y3": 166.534, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 300.397, "t": 161.07898, "r": 323.99118, "b": 169.14868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.397, "r_y0": 169.14868, "r_x1": 323.99118, "r_y1": 169.14868, "r_x2": 323.99118, "r_y2": 161.07898, "r_x3": 300.397, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 370.345, "t": 166.55895999999996, "r": 414.74661, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.345, "r_y0": 174.62865999999997, "r_x1": 414.74661, "r_y1": 174.62865999999997, "r_x2": 414.74661, "r_y2": 166.55895999999996, "r_x3": 370.345, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 426.737, "t": 161.07898, "r": 463.10830999999996, "b": 169.14868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.737, "r_y0": 169.14868, "r_x1": 463.10830999999996, "r_y1": 169.14868, "r_x2": 463.10830999999996, "r_y2": 161.07898, "r_x3": 426.737, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 423.11401, "t": 172.03796, "r": 466.72656, "b": 180.10766999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11401, "r_y0": 180.10766999999998, "r_x1": 466.72656, "r_y1": 180.10766999999998, "r_x2": 466.72656, "r_y2": 172.03796, "r_x3": 423.11401, "r_y3": 172.03796, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 262.41299, "t": 174.03101000000004, "r": 288.0596, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41299, "r_y0": 182.10071000000005, "r_x1": 288.0596, "r_y1": 182.10071000000005, "r_x2": 288.0596, "r_y2": 174.03101000000004, "r_x3": 262.41299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 296.42899, "t": 174.03101000000004, "r": 329.44687, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.42899, "r_y0": 182.10071000000005, "r_x1": 329.44687, "r_y1": 182.10071000000005, "r_x2": 329.44687, "r_y2": 174.03101000000004, "r_x3": 296.42899, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 345.03299, "t": 174.03101000000004, "r": 354.75793, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03299, "r_y0": 182.10071000000005, "r_x1": 354.75793, "r_y1": 182.10071000000005, "r_x2": 354.75793, "r_y2": 174.03101000000004, "r_x3": 345.03299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 154.53799, "t": 192.85999000000004, "r": 201.24129, "b": 200.92969000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.53799, "r_y0": 200.92969000000005, "r_x1": 201.24129, "r_y1": 200.92969000000005, "r_x2": 201.24129, "r_y2": 192.85999000000004, "r_x3": 154.53799, "r_y3": 192.85999000000004, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 222.43700000000004, "t": 187.38098000000002, "r": 247.13226000000003, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 195.45068000000003, "r_x1": 247.13226000000003, "r_y1": 195.45068000000003, "r_x2": 247.13226000000003, "r_y2": 187.38098000000002, "r_x3": 222.43700000000004, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 264.74399, "t": 187.38098000000002, "r": 285.73074, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 195.45068000000003, "r_x1": 285.73074, "r_y1": 195.45068000000003, "r_x2": 285.73074, "r_y2": 187.38098000000002, "r_x3": 264.74399, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 302.444, "t": 187.38098000000002, "r": 323.43076, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 195.45068000000003, "r_x1": 323.43076, "r_y1": 195.45068000000003, "r_x2": 323.43076, "r_y2": 187.38098000000002, "r_x3": 302.444, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 339.40302, "t": 187.38098000000002, "r": 360.38977, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 195.45068000000003, "r_x1": 360.38977, "r_y1": 195.45068000000003, "r_x2": 360.38977, "r_y2": 187.38098000000002, "r_x3": 339.40302, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 383.116, "t": 187.31817999999998, "r": 401.97324, "b": 195.24451, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.116, "r_y0": 195.24451, "r_x1": 401.97324, "r_y1": 195.24451, "r_x2": 401.97324, "r_y2": 187.31817999999998, "r_x3": 383.116, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 435.49300999999997, "t": 187.31817999999998, "r": 454.35025, "b": 195.24451, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 195.24451, "r_x1": 454.35025, "r_y1": 195.24451, "r_x2": 454.35025, "r_y2": 187.31817999999998, "r_x3": 435.49300999999997, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 220.903, "t": 200.33196999999996, "r": 248.66655999999998, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 208.40166999999997, "r_x1": 248.66655999999998, "r_y1": 208.40166999999997, "r_x2": 248.66655999999998, "r_y2": 200.33196999999996, "r_x3": 220.903, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 264.74399, "t": 200.33196999999996, "r": 285.73074, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 208.40166999999997, "r_x1": 285.73074, "r_y1": 208.40166999999997, "r_x2": 285.73074, "r_y2": 200.33196999999996, "r_x3": 264.74399, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 302.444, "t": 200.33196999999996, "r": 323.43076, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 208.40166999999997, "r_x1": 323.43076, "r_y1": 208.40166999999997, "r_x2": 323.43076, "r_y2": 200.33196999999996, "r_x3": 302.444, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 339.40302, "t": 200.33196999999996, "r": 360.38977, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 208.40166999999997, "r_x1": 360.38977, "r_y1": 208.40166999999997, "r_x2": 360.38977, "r_y2": 200.33196999999996, "r_x3": 339.40302, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 382.052, "t": 200.33196999999996, "r": 403.03876, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 208.40166999999997, "r_x1": 403.03876, "r_y1": 208.40166999999997, "r_x2": 403.03876, "r_y2": 200.33196999999996, "r_x3": 382.052, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 436.73199000000005, "t": 200.33196999999996, "r": 453.11182, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 208.40166999999997, "r_x1": 453.11182, "r_y1": 208.40166999999997, "r_x2": 453.11182, "r_y2": 200.33196999999996, "r_x3": 436.73199000000005, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 155.94501, "t": 219.16198999999995, "r": 199.83374, "b": 227.23168999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.94501, "r_y0": 227.23168999999996, "r_x1": 199.83374, "r_y1": 227.23168999999996, "r_x2": 199.83374, "r_y2": 219.16198999999995, "r_x3": 155.94501, "r_y3": 219.16198999999995, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 222.43700000000004, "t": 213.68201, "r": 247.13226000000003, "b": 221.75171, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 221.75171, "r_x1": 247.13226000000003, "r_y1": 221.75171, "r_x2": 247.13226000000003, "r_y2": 213.68201, "r_x3": 222.43700000000004, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 264.74399, "t": 213.68201, "r": 285.73074, "b": 221.75171, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 221.75171, "r_x1": 285.73074, "r_y1": 221.75171, "r_x2": 285.73074, "r_y2": 213.68201, "r_x3": 264.74399, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 302.444, "t": 213.68201, "r": 323.43076, "b": 221.75171, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 221.75171, "r_x1": 323.43076, "r_y1": 221.75171, "r_x2": 323.43076, "r_y2": 213.68201, "r_x3": 302.444, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 337.815, "t": 213.61919999999998, "r": 361.97586, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 221.54552999999999, "r_x1": 361.97586, "r_y1": 221.54552999999999, "r_x2": 361.97586, "r_y2": 213.61919999999998, "r_x3": 337.815, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 380.46399, "t": 213.61919999999998, "r": 404.62485, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 221.54552999999999, "r_x1": 404.62485, "r_y1": 221.54552999999999, "r_x2": 404.62485, "r_y2": 213.61919999999998, "r_x3": 380.46399, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 435.49300999999997, "t": 213.61919999999998, "r": 454.35025, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 221.54552999999999, "r_x1": 454.35025, "r_y1": 221.54552999999999, "r_x2": 454.35025, "r_y2": 213.61919999999998, "r_x3": 435.49300999999997, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 220.903, "t": 226.63396999999998, "r": 248.66655999999998, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 234.70367, "r_x1": 248.66655999999998, "r_y1": 234.70367, "r_x2": 248.66655999999998, "r_y2": 226.63396999999998, "r_x3": 220.903, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 264.74399, "t": 226.63396999999998, "r": 285.73074, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 234.70367, "r_x1": 285.73074, "r_y1": 234.70367, "r_x2": 285.73074, "r_y2": 226.63396999999998, "r_x3": 264.74399, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 302.444, "t": 226.63396999999998, "r": 323.43076, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 234.70367, "r_x1": 323.43076, "r_y1": 234.70367, "r_x2": 323.43076, "r_y2": 226.63396999999998, "r_x3": 302.444, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 341.70599, "t": 226.63396999999998, "r": 358.08582, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.70599, "r_y0": 234.70367, "r_x1": 358.08582, "r_y1": 234.70367, "r_x2": 358.08582, "r_y2": 226.63396999999998, "r_x3": 341.70599, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 382.052, "t": 226.63396999999998, "r": 403.03876, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 234.70367, "r_x1": 403.03876, "r_y1": 234.70367, "r_x2": 403.03876, "r_y2": 226.63396999999998, "r_x3": 382.052, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 436.73199000000005, "t": 226.63396999999998, "r": 453.11182, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 234.70367, "r_x1": 453.11182, "r_y1": 234.70367, "r_x2": 453.11182, "r_y2": 226.63396999999998, "r_x3": 436.73199000000005, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 148.62601, "t": 245.46294999999998, "r": 207.1524, "b": 253.53265, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.62601, "r_y0": 253.53265, "r_x1": 207.1524, "r_y1": 253.53265, "r_x2": 207.1524, "r_y2": 245.46294999999998, "r_x3": 148.62601, "r_y3": 245.46294999999998, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 222.43700000000004, "t": 239.98297000000002, "r": 247.13226000000003, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 248.05267000000003, "r_x1": 247.13226000000003, "r_y1": 248.05267000000003, "r_x2": 247.13226000000003, "r_y2": 239.98297000000002, "r_x3": 222.43700000000004, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 264.74399, "t": 239.98297000000002, "r": 285.73074, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 248.05267000000003, "r_x1": 285.73074, "r_y1": 248.05267000000003, "r_x2": 285.73074, "r_y2": 239.98297000000002, "r_x3": 264.74399, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 302.444, "t": 239.98297000000002, "r": 323.43076, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 248.05267000000003, "r_x1": 323.43076, "r_y1": 248.05267000000003, "r_x2": 323.43076, "r_y2": 239.98297000000002, "r_x3": 302.444, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 337.815, "t": 239.92016999999998, "r": 361.97586, "b": 247.8465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 247.8465, "r_x1": 361.97586, "r_y1": 247.8465, "r_x2": 361.97586, "r_y2": 239.92016999999998, "r_x3": 337.815, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 380.46399, "t": 239.92016999999998, "r": 404.62485, "b": 247.8465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 247.8465, "r_x1": 404.62485, "r_y1": 247.8465, "r_x2": 404.62485, "r_y2": 239.92016999999998, "r_x3": 380.46399, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 435.49300999999997, "t": 239.92016999999998, "r": 454.35025, "b": 247.8465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 247.8465, "r_x1": 454.35025, "r_y1": 247.8465, "r_x2": 454.35025, "r_y2": 239.92016999999998, "r_x3": 435.49300999999997, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 220.903, "t": 252.93499999999995, "r": 248.66655999999998, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 261.00469999999996, "r_x1": 248.66655999999998, "r_y1": 261.00469999999996, "r_x2": 248.66655999999998, "r_y2": 252.93499999999995, "r_x3": 220.903, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 264.74399, "t": 252.93499999999995, "r": 285.73074, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 261.00469999999996, "r_x1": 285.73074, "r_y1": 261.00469999999996, "r_x2": 285.73074, "r_y2": 252.93499999999995, "r_x3": 264.74399, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 302.444, "t": 252.93499999999995, "r": 323.43076, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 261.00469999999996, "r_x1": 323.43076, "r_y1": 261.00469999999996, "r_x2": 323.43076, "r_y2": 252.93499999999995, "r_x3": 302.444, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 339.40302, "t": 252.93499999999995, "r": 360.38977, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 261.00469999999996, "r_x1": 360.38977, "r_y1": 261.00469999999996, "r_x2": 360.38977, "r_y2": 252.93499999999995, "r_x3": 339.40302, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 382.052, "t": 252.93499999999995, "r": 403.03876, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 261.00469999999996, "r_x1": 403.03876, "r_y1": 261.00469999999996, "r_x2": 403.03876, "r_y2": 252.93499999999995, "r_x3": 382.052, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 436.73199000000005, "t": 252.93499999999995, "r": 453.11182, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 261.00469999999996, "r_x1": 453.11182, "r_y1": 261.00469999999996, "r_x2": 453.11182, "r_y2": 252.93499999999995, "r_x3": 436.73199000000005, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ched", "ched", "ched", "ucel", "ucel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 7, "table_cells": [ { "bbox": { "l": 160.782, "t": 166.55895999999996, "r": 194.99779, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Data set", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 215.52499000000003, "t": 166.534, "r": 254.04465, "b": 174.6037, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 300.397, "t": 161.07898, "r": 323.99118, "b": 169.14868, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 5, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 370.345, "t": 166.55895999999996, "r": 414.74661, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "mAP(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 426.737, "t": 161.07898, "r": 463.10830999999996, "b": 169.14868, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "Inference time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 262.41299, "t": 174.03101000000004, "r": 288.0596, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 296.42899, "t": 174.03101000000004, "r": 329.44687, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 345.03299, "t": 174.03101000000004, "r": 354.75793, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 154.53799, "t": 192.85999000000004, "r": 201.24129, "b": 200.92969000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.43700000000004, "t": 187.38098000000002, "r": 247.13226000000003, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74399, "t": 187.38098000000002, "r": 285.73074, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.444, "t": 187.38098000000002, "r": 323.43076, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 339.40302, "t": 187.38098000000002, "r": 360.38977, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 383.116, "t": 187.31817999999998, "r": 401.97324, "b": 195.24451, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49300999999997, "t": 187.31817999999998, "r": 454.35025, "b": 195.24451, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 155.94501, "t": 219.16198999999995, "r": 199.83374, "b": 227.23168999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.43700000000004, "t": 213.68201, "r": 247.13226000000003, "b": 221.75171, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74399, "t": 213.68201, "r": 285.73074, "b": 221.75171, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.955 0.917", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.444, "t": 213.68201, "r": 323.43076, "b": 221.75171, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.961 0.922", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.815, "t": 213.61919999999998, "r": 361.97586, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.959 0.92", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.46399, "t": 213.61919999999998, "r": 404.62485, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.862 0.722", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49300999999997, "t": 213.61919999999998, "r": 454.35025, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.85 3.26", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 148.62601, "t": 245.46294999999998, "r": 207.1524, "b": 253.53265, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTables-1M", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.43700000000004, "t": 239.98297000000002, "r": 247.13226000000003, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74399, "t": 239.98297000000002, "r": 285.73074, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.987 0.983", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.444, "t": 239.98297000000002, "r": 323.43076, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.964 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.815, "t": 239.92016999999998, "r": 361.97586, "b": 247.8465, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.977 0.966", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.46399, "t": 239.92016999999998, "r": 404.62485, "b": 247.8465, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.896 0.889", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49300999999997, "t": 239.92016999999998, "r": 454.35025, "b": 247.8465, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.79 3.26", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "section_header", "id": 3, "page_no": 9, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.765, "t": 288.91479, "r": 257.08679, "b": 297.72173999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9546447992324829, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 297.72173999999995, "r_x1": 149.40205, "r_y1": 297.72173999999995, "r_x2": 149.40205, "r_y2": 288.91479, "r_x3": 134.765, "r_y3": 288.91479, "coord_origin": "TOPLEFT" }, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 297.72173999999995, "r_x1": 257.08679, "r_y1": 297.72173999999995, "r_x2": 257.08679, "r_y2": 288.91479, "r_x3": 160.85904, "r_y3": 288.91479, "coord_origin": "TOPLEFT" }, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.3 Qualitative Results" }, { "label": "text", "id": 1, "page_no": 9, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 309.86078, "r": 480.58981, "b": 366.47769, "coord_origin": "TOPLEFT" }, "confidence": 0.9834085702896118, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 318.65775, "r_x1": 480.58777, "r_y1": 318.65775, "r_x2": 480.58777, "r_y2": 309.86078, "r_x3": 134.765, "r_y3": 309.86078, "coord_origin": "TOPLEFT" }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "orig": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 330.61273, "r_x1": 480.58889999999997, "r_y1": 330.61273, "r_x2": 480.58889999999997, "r_y2": 321.81577, "r_x3": 134.765, "r_y3": 321.81577, "coord_origin": "TOPLEFT" }, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 342.56772, "r_x1": 480.58681999999993, "r_y1": 342.56772, "r_x2": 480.58681999999993, "r_y2": 333.77075, "r_x3": 134.765, "r_y3": 333.77075, "coord_origin": "TOPLEFT" }, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 354.52271, "r_x1": 480.58981, "r_y1": 354.52271, "r_x2": 480.58981, "r_y2": 345.72574, "r_x3": 134.765, "r_y3": 345.72574, "coord_origin": "TOPLEFT" }, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 366.47769, "r_x1": 161.65704, "r_y1": 366.47769, "r_x2": 161.65704, "r_y2": 357.68073, "r_x3": 134.765, "r_y3": 357.68073, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5 demonstrates less overlap and more accurate bounding boxes with OTSL. In Figure 6, OTSL proves to be more effective in handling tables with longer token sequences, resulting in even more precise structure prediction and bounding boxes." }, { "label": "caption", "id": 5, "page_no": 9, "cluster": { "id": 5, "label": "caption", "bbox": { "l": 134.765, "t": 397.59012, "r": 480.59106, "b": 439.71716, "coord_origin": "TOPLEFT" }, "confidence": 0.9482728838920593, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 405.51642, "r_x1": 162.64424, "r_y1": 405.51642, "r_x2": 162.64424, "r_y2": 397.59012, "r_x3": 134.765, "r_y3": 397.59012, "coord_origin": "TOPLEFT" }, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.384, "r_y0": 405.72266, "r_x1": 480.59106, "r_y1": 405.72266, "r_x2": 480.59106, "r_y2": 397.65289, "r_x3": 167.384, "r_y3": 397.65289, "coord_origin": "TOPLEFT" }, "text": "The OTSL model produces more accurate bounding boxes with less over-", "orig": "The OTSL model produces more accurate bounding boxes with less over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 416.68167000000005, "r_x1": 480.59106, "r_y1": 416.68167000000005, "r_x2": 480.59106, "r_y2": 408.61190999999997, "r_x3": 134.765, "r_y3": 408.61190999999997, "coord_origin": "TOPLEFT" }, "text": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 427.64066, "r_x1": 480.58838000000003, "r_y1": 427.64066, "r_x2": 480.58838000000003, "r_y2": 419.57089, "r_x3": 134.765, "r_y3": 419.57089, "coord_origin": "TOPLEFT" }, "text": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "orig": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 438.59964, "r_x1": 304.69171, "r_y1": 438.59964, "r_x2": 304.69171, "r_y2": 430.52987999999993, "r_x3": 134.765, "r_y3": 430.52987999999993, "coord_origin": "TOPLEFT" }, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 342.63354, "r_y0": 439.71716, "r_x1": 344.81915, "r_y1": 439.71716, "r_x2": 344.81915, "r_y2": 430.19678, "r_x3": 342.63354, "r_y3": 430.19678, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 5. The OTSL model produces more accurate bounding boxes with less overlap (E) than the HTML model (D), when predicting the structure of a sparse table (A), at twice the inference speed because of shorter sequence length (B),(C). \"PMC2807444_006_00.png\" PubTabNet. \u03bc" }, { "label": "picture", "id": 2, "page_no": 9, "cluster": { "id": 2, "label": "picture", "bbox": { "l": 162.67430114746094, "t": 444.62255859375, "r": 451.70062255859375, "b": 663.2135620117188, "coord_origin": "TOPLEFT" }, "confidence": 0.9742383360862732, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 518.94992, "r_x1": 190.62042, "r_y1": 518.94992, "r_x2": 190.62042, "r_y2": 516.2332200000001, "r_x3": 180.12473, "r_y3": 516.2332200000001, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 522.84879, "r_x1": 304.54797, "r_y1": 522.84879, "r_x2": 304.54797, "r_y2": 520.13208, "r_x3": 183.2438, "r_y3": 520.13208, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 526.74765, "r_x1": 388.42313, "r_y1": 526.74765, "r_x2": 388.42313, "r_y2": 524.03094, "r_x3": 183.2438, "r_y3": 524.03094, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 530.64648, "r_x1": 388.42313, "r_y1": 530.64648, "r_x2": 388.42313, "r_y2": 527.9297799999999, "r_x3": 183.2438, "r_y3": 527.9297799999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 534.54532, "r_x1": 388.42313, "r_y1": 534.54532, "r_x2": 388.42313, "r_y2": 531.82861, "r_x3": 183.2438, "r_y3": 531.82861, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 538.44418, "r_x1": 388.42313, "r_y1": 538.44418, "r_x2": 388.42313, "r_y2": 535.72748, "r_x3": 183.2438, "r_y3": 535.72748, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 542.34303, "r_x1": 388.42313, "r_y1": 542.34303, "r_x2": 388.42313, "r_y2": 539.62631, "r_x3": 183.2438, "r_y3": 539.62631, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 546.24188, "r_x1": 388.42313, "r_y1": 546.24188, "r_x2": 388.42313, "r_y2": 543.52516, "r_x3": 183.2438, "r_y3": 543.52516, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 550.14073, "r_x1": 388.42313, "r_y1": 550.14073, "r_x2": 388.42313, "r_y2": 547.42401, "r_x3": 183.2438, "r_y3": 547.42401, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 554.03958, "r_x1": 388.42313, "r_y1": 554.03958, "r_x2": 388.42313, "r_y2": 551.32286, "r_x3": 183.2438, "r_y3": 551.32286, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 557.93845, "r_x1": 191.86806, "r_y1": 557.93845, "r_x2": 191.86806, "r_y2": 555.22173, "r_x3": 180.12473, "r_y3": 555.22173, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 521.01712, "r_x1": 408.82025, "r_y1": 521.01712, "r_x2": 408.82025, "r_y2": 518.30042, "r_x3": 407.38348, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 521.01712, "r_x1": 450.48605, "r_y1": 521.01712, "r_x2": 450.48605, "r_y2": 518.30042, "r_x3": 410.25699, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 524.9159500000001, "r_x1": 408.82025, "r_y1": 524.9159500000001, "r_x2": 408.82025, "r_y2": 522.19925, "r_x3": 407.38348, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 524.9159500000001, "r_x1": 450.48605, "r_y1": 524.9159500000001, "r_x2": 450.48605, "r_y2": 522.19925, "r_x3": 410.25699, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 528.81479, "r_x1": 408.82025, "r_y1": 528.81479, "r_x2": 408.82025, "r_y2": 526.09808, "r_x3": 407.38348, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 528.81479, "r_x1": 450.48605, "r_y1": 528.81479, "r_x2": 450.48605, "r_y2": 526.09808, "r_x3": 410.25699, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 532.7136499999999, "r_x1": 408.82025, "r_y1": 532.7136499999999, "r_x2": 408.82025, "r_y2": 529.99695, "r_x3": 407.38348, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 532.7136499999999, "r_x1": 450.48605, "r_y1": 532.7136499999999, "r_x2": 450.48605, "r_y2": 529.99695, "r_x3": 410.25699, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 536.6125, "r_x1": 408.82025, "r_y1": 536.6125, "r_x2": 408.82025, "r_y2": 533.8957800000001, "r_x3": 407.38348, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 536.6125, "r_x1": 450.48605, "r_y1": 536.6125, "r_x2": 450.48605, "r_y2": 533.8957800000001, "r_x3": 410.25699, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 540.51135, "r_x1": 408.82025, "r_y1": 540.51135, "r_x2": 408.82025, "r_y2": 537.79463, "r_x3": 407.38348, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 540.51135, "r_x1": 450.48605, "r_y1": 540.51135, "r_x2": 450.48605, "r_y2": 537.79463, "r_x3": 410.25699, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 544.4102, "r_x1": 408.82025, "r_y1": 544.4102, "r_x2": 408.82025, "r_y2": 541.69348, "r_x3": 407.38348, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 544.4102, "r_x1": 450.48605, "r_y1": 544.4102, "r_x2": 450.48605, "r_y2": 541.69348, "r_x3": 410.25699, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 548.3090500000001, "r_x1": 408.82025, "r_y1": 548.3090500000001, "r_x2": 408.82025, "r_y2": 545.59233, "r_x3": 407.38348, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 548.3090500000001, "r_x1": 450.48605, "r_y1": 548.3090500000001, "r_x2": 450.48605, "r_y2": 545.59233, "r_x3": 410.25699, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 552.2079200000001, "r_x1": 408.82025, "r_y1": 552.2079200000001, "r_x2": 408.82025, "r_y2": 549.4911999999999, "r_x3": 407.38348, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 552.2079200000001, "r_x1": 450.48605, "r_y1": 552.2079200000001, "r_x2": 450.48605, "r_y2": 549.4911999999999, "r_x3": 410.25699, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.52881, "r_y0": 515.31, "r_x1": 181.8528, "r_y1": 515.31, "r_x2": 181.8528, "r_y2": 509.45859, "r_x3": 164.52881, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58441, "r_y0": 515.31, "r_x1": 186.3974, "r_y1": 515.31, "r_x2": 186.3974, "r_y2": 509.45859, "r_x3": 183.58441, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2104, "r_y0": 515.31, "r_x1": 208.90137, "r_y1": 515.31, "r_x2": 208.90137, "r_y2": 509.45859, "r_x3": 189.2104, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63269, "r_y0": 515.31, "r_x1": 221.04044, "r_y1": 515.31, "r_x2": 221.04044, "r_y2": 509.45859, "r_x3": 210.63269, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.20203, "r_y0": 515.45502, "r_x1": 406.83609, "r_y1": 515.45502, "r_x2": 406.83609, "r_y2": 509.60361, "r_x3": 390.20203, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.56952, "r_y0": 515.45502, "r_x1": 411.38251, "r_y1": 515.45502, "r_x2": 411.38251, "r_y2": 509.60361, "r_x3": 408.56952, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.1955, "r_y0": 515.45502, "r_x1": 433.88647000000003, "r_y1": 515.45502, "r_x2": 433.88647000000003, "r_y2": 509.60361, "r_x3": 414.1955, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61737, "r_y0": 515.45502, "r_x1": 446.02512, "r_y1": 515.45502, "r_x2": 446.02512, "r_y2": 509.60361, "r_x3": 435.61737, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19316, "r_y0": 526.3866, "r_x1": 172.8231, "r_y1": 526.3866, "r_x2": 172.8231, "r_y2": 519.07236, "r_x3": 167.19316, "r_y3": 519.07236, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.33745, "r_y0": 455.93909, "r_x1": 192.96739, "r_y1": 455.93909, "r_x2": 192.96739, "r_y2": 448.62485, "r_x3": 187.33745, "r_y3": 448.62485, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.38654, "r_y0": 573.3194, "r_x1": 173.01648, "r_y1": 573.3194, "r_x2": 173.01648, "r_y2": 566.0051599999999, "r_x3": 167.38654, "r_y3": 566.0051599999999, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.45621000000003, "r_y0": 629.09431, "r_x1": 253.65727, "r_y1": 629.09431, "r_x2": 253.65727, "r_y2": 621.78008, "r_x3": 248.45621000000003, "r_y3": 621.78008, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.90057, "r_y0": 526.5137, "r_x1": 401.53052, "r_y1": 526.5137, "r_x2": 401.53052, "r_y2": 519.19946, "r_x3": 395.90057, "r_y3": 519.19946, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.62886, "r_y0": 597.26784, "r_x1": 177.48148, "r_y1": 597.26784, "r_x2": 177.48148, "r_y2": 580.28853, "r_x3": 171.62886, "r_y3": 580.28853, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.05969000000002, "r_y0": 649.92345, "r_x1": 256.91235, "r_y1": 649.92345, "r_x2": 256.91235, "r_y2": 633.63408, "r_x3": 251.05969000000002, "r_y3": 633.63408, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 607.30864, "r_x1": 427.0379, "r_y1": 607.30864, "r_x2": 427.0379, "r_y2": 601.45724, "r_x3": 372.14645, "r_y3": 601.45724, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 613.75087, "r_x1": 430.06838999999997, "r_y1": 613.75087, "r_x2": 430.06838999999997, "r_y2": 607.89948, "r_x3": 372.14645, "r_y3": 607.89948, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 648.72348, "r_x1": 231.08191, "r_y1": 648.72348, "r_x2": 231.08191, "r_y2": 642.87209, "r_x3": 176.88042, "r_y3": 642.87209, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 655.1657, "r_x1": 230.99271000000002, "r_y1": 655.1657, "r_x2": 230.99271000000002, "r_y2": 649.3143, "r_x3": 176.88042, "r_y3": 649.3143, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 661.60794, "r_x1": 203.93219, "r_y1": 661.60794, "r_x2": 203.93219, "r_y2": 655.7565500000001, "r_x3": 176.88042, "r_y3": 655.7565500000001, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93231000000003, "r_y0": 569.15967, "r_x1": 218.4697, "r_y1": 569.15967, "r_x2": 218.4697, "r_y2": 557.56342, "r_x3": 215.93231000000003, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.05689999999998, "r_y0": 569.15967, "r_x1": 231.71908999999997, "r_y1": 569.15967, "r_x2": 231.71908999999997, "r_y2": 557.56342, "r_x3": 229.05689999999998, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.20892, "r_y0": 451.19727, "r_x1": 263.56973, "r_y1": 451.19727, "r_x2": 263.56973, "r_y2": 448.46124, "r_x3": 261.20892, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33463, "r_y0": 451.19727, "r_x1": 313.6362, "r_y1": 451.19727, "r_x2": 313.6362, "r_y2": 448.46124, "r_x3": 312.33463, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41125, "r_y0": 451.19727, "r_x1": 380.05737, "r_y1": 451.19727, "r_x2": 380.05737, "r_y2": 448.46124, "r_x3": 377.41125, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63976, "r_y0": 456.07599, "r_x1": 205.82492, "r_y1": 456.07599, "r_x2": 205.82492, "r_y2": 453.33997, "r_x3": 200.63976, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.20833000000002, "r_y0": 456.07599, "r_x1": 229.76836, "r_y1": 456.07599, "r_x2": 229.76836, "r_y2": 453.33997, "r_x3": 222.20833000000002, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26666, "r_y0": 456.07599, "r_x1": 250.82669, "r_y1": 456.07599, "r_x2": 250.82669, "r_y2": 453.33997, "r_x3": 243.26666, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29657, "r_y0": 456.07599, "r_x1": 271.84949, "r_y1": 456.07599, "r_x2": 271.84949, "r_y2": 453.33997, "r_x3": 264.29657, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.31943, "r_y0": 456.07599, "r_x1": 292.87946, "r_y1": 456.07599, "r_x2": 292.87946, "r_y2": 453.33997, "r_x3": 285.31943, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37775, "r_y0": 456.07599, "r_x1": 311.77319, "r_y1": 456.07599, "r_x2": 311.77319, "r_y2": 453.33997, "r_x3": 306.37775, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.41699, "r_y0": 456.07599, "r_x1": 325.58157, "r_y1": 456.07599, "r_x2": 325.58157, "r_y2": 453.33997, "r_x3": 323.41699, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.45807, "r_y0": 456.07599, "r_x1": 336.62265, "r_y1": 456.07599, "r_x2": 336.62265, "r_y2": 453.33997, "r_x3": 334.45807, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52756, "r_y0": 456.07599, "r_x1": 347.69214, "r_y1": 456.07599, "r_x2": 347.69214, "r_y2": 453.33997, "r_x3": 345.52756, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56863, "r_y0": 456.07599, "r_x1": 358.73322, "r_y1": 456.07599, "r_x2": 358.73322, "r_y2": 453.33997, "r_x3": 356.56863, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63812, "r_y0": 456.07599, "r_x1": 371.97089, "r_y1": 456.07599, "r_x2": 371.97089, "r_y2": 453.33997, "r_x3": 367.63812, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.6734, "r_y0": 456.07599, "r_x1": 387.00616, "r_y1": 456.07599, "r_x2": 387.00616, "r_y2": 453.33997, "r_x3": 382.6734, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73727, "r_y0": 456.07599, "r_x1": 402.07001, "r_y1": 456.07599, "r_x2": 402.07001, "r_y2": 453.33997, "r_x3": 397.73727, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78879, "r_y0": 457.79964999999993, "r_x1": 414.93463, "r_y1": 457.79964999999993, "r_x2": 414.93463, "r_y2": 447.99298, "r_x3": 412.78879, "r_y3": 447.99298, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.95697, "r_y0": 456.07599, "r_x1": 422.51746, "r_y1": 456.07599, "r_x2": 422.51746, "r_y2": 453.33997, "r_x3": 414.95697, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63998, "r_y0": 466.66043, "r_x1": 204.57674, "r_y1": 466.66043, "r_x2": 204.57674, "r_y2": 463.92444, "r_x3": 200.63998, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62604, "r_y0": 466.66043, "r_x1": 369.58032, "r_y1": 466.66043, "r_x2": 369.58032, "r_y2": 463.92444, "r_x3": 367.62604, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 466.66043, "r_x1": 384.6156, "r_y1": 466.66043, "r_x2": 384.6156, "r_y2": 463.92444, "r_x3": 382.66132, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72504, "r_y0": 466.66043, "r_x1": 399.67932, "r_y1": 466.66043, "r_x2": 399.67932, "r_y2": 463.92444, "r_x3": 397.72504, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.53915, "r_x1": 206.51694, "r_y1": 471.53915, "r_x2": 206.51694, "r_y2": 468.80313, "r_x3": 200.64, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 471.53915, "r_x1": 266.25885, "r_y1": 471.53915, "r_x2": 266.25885, "r_y2": 468.80313, "r_x3": 264.29047, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37213, "r_y0": 471.53915, "r_x1": 308.34052, "r_y1": 471.53915, "r_x2": 308.34052, "r_y2": 468.80313, "r_x3": 306.37213, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.51526, "r_y0": 471.53915, "r_x1": 347.48364, "r_y1": 471.53915, "r_x2": 347.48364, "r_y2": 468.80313, "r_x3": 345.51526, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.55634, "r_y0": 471.53915, "r_x1": 358.52472, "r_y1": 471.53915, "r_x2": 358.52472, "r_y2": 468.80313, "r_x3": 356.55634, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62582, "r_y0": 471.53915, "r_x1": 369.59418, "r_y1": 471.53915, "r_x2": 369.59418, "r_y2": 468.80313, "r_x3": 367.62582, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66107, "r_y0": 471.53915, "r_x1": 384.62946, "r_y1": 471.53915, "r_x2": 384.62946, "r_y2": 468.80313, "r_x3": 382.66107, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.41788, "r_x1": 206.51694, "r_y1": 476.41788, "r_x2": 206.51694, "r_y2": 473.68185, "r_x3": 200.64, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 476.41788, "r_x1": 266.25885, "r_y1": 476.41788, "r_x2": 266.25885, "r_y2": 473.68185, "r_x3": 264.29047, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.26816, "r_x1": 206.51694, "r_y1": 481.26816, "r_x2": 206.51694, "r_y2": 478.53214, "r_x3": 200.64, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26373, "r_y0": 481.26816, "r_x1": 245.2321, "r_y1": 481.26816, "r_x2": 245.2321, "r_y2": 478.53214, "r_x3": 243.26373, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 481.26816, "r_x1": 266.25885, "r_y1": 481.26816, "r_x2": 266.25885, "r_y2": 478.53214, "r_x3": 264.29047, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.40466, "r_y0": 481.26816, "r_x1": 325.37305, "r_y1": 481.26816, "r_x2": 325.37305, "r_y2": 478.53214, "r_x3": 323.40466, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72519, "r_y0": 481.26816, "r_x1": 399.69354, "r_y1": 481.26816, "r_x2": 399.69354, "r_y2": 478.53214, "r_x3": 397.72519, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.14688, "r_x1": 206.51694, "r_y1": 486.14688, "r_x2": 206.51694, "r_y2": 483.41086, "r_x3": 200.64, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 486.14688, "r_x1": 384.61563, "r_y1": 486.14688, "r_x2": 384.61563, "r_y2": 483.41086, "r_x3": 382.66132, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72513, "r_y0": 486.14688, "r_x1": 401.64819, "r_y1": 486.14688, "r_x2": 401.64819, "r_y2": 483.41086, "r_x3": 397.72513, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78928, "r_y0": 486.14688, "r_x1": 414.74359, "r_y1": 486.14688, "r_x2": 414.74359, "r_y2": 483.41086, "r_x3": 412.78928, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64014, "r_y0": 491.0256, "r_x1": 207.14445, "r_y1": 491.0256, "r_x2": 207.14445, "r_y2": 488.28958, "r_x3": 200.64014, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62616, "r_y0": 491.0256, "r_x1": 369.78375, "r_y1": 491.0256, "r_x2": 369.78375, "r_y2": 488.28958, "r_x3": 367.62616, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66141, "r_y0": 491.0256, "r_x1": 384.81897, "r_y1": 491.0256, "r_x2": 384.81897, "r_y2": 488.28958, "r_x3": 382.66141, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7251, "r_y0": 491.0256, "r_x1": 402.05087, "r_y1": 491.0256, "r_x2": 402.05087, "r_y2": 488.28958, "r_x3": 397.7251, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64032, "r_y0": 495.90433, "r_x1": 208.48566, "r_y1": 495.90433, "r_x2": 208.48566, "r_y2": 493.1683, "r_x3": 200.64032, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29044, "r_y0": 495.90433, "r_x1": 266.25879, "r_y1": 495.90433, "r_x2": 266.25879, "r_y2": 493.1683, "r_x3": 264.29044, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 58, "label": "text", "bbox": { "l": 180.12473, "t": 516.2332200000001, "r": 190.62042, "b": 518.94992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 518.94992, "r_x1": 190.62042, "r_y1": 518.94992, "r_x2": 190.62042, "r_y2": 516.2332200000001, "r_x3": 180.12473, "r_y3": 516.2332200000001, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 183.2438, "t": 520.13208, "r": 304.54797, "b": 522.84879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 522.84879, "r_x1": 304.54797, "r_y1": 522.84879, "r_x2": 304.54797, "r_y2": 520.13208, "r_x3": 183.2438, "r_y3": 520.13208, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.2438, "t": 524.03094, "r": 388.42313, "b": 526.74765, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 526.74765, "r_x1": 388.42313, "r_y1": 526.74765, "r_x2": 388.42313, "r_y2": 524.03094, "r_x3": 183.2438, "r_y3": 524.03094, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 183.2438, "t": 527.9297799999999, "r": 388.42313, "b": 530.64648, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 530.64648, "r_x1": 388.42313, "r_y1": 530.64648, "r_x2": 388.42313, "r_y2": 527.9297799999999, "r_x3": 183.2438, "r_y3": 527.9297799999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 183.2438, "t": 531.82861, "r": 388.42313, "b": 534.54532, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 534.54532, "r_x1": 388.42313, "r_y1": 534.54532, "r_x2": 388.42313, "r_y2": 531.82861, "r_x3": 183.2438, "r_y3": 531.82861, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 183.2438, "t": 535.72748, "r": 388.42313, "b": 538.44418, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 538.44418, "r_x1": 388.42313, "r_y1": 538.44418, "r_x2": 388.42313, "r_y2": 535.72748, "r_x3": 183.2438, "r_y3": 535.72748, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 183.2438, "t": 539.62631, "r": 388.42313, "b": 542.34303, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 542.34303, "r_x1": 388.42313, "r_y1": 542.34303, "r_x2": 388.42313, "r_y2": 539.62631, "r_x3": 183.2438, "r_y3": 539.62631, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 183.2438, "t": 543.52516, "r": 388.42313, "b": 546.24188, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 546.24188, "r_x1": 388.42313, "r_y1": 546.24188, "r_x2": 388.42313, "r_y2": 543.52516, "r_x3": 183.2438, "r_y3": 543.52516, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 183.2438, "t": 547.42401, "r": 388.42313, "b": 550.14073, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 550.14073, "r_x1": 388.42313, "r_y1": 550.14073, "r_x2": 388.42313, "r_y2": 547.42401, "r_x3": 183.2438, "r_y3": 547.42401, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.2438, "t": 551.32286, "r": 388.42313, "b": 554.03958, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 554.03958, "r_x1": 388.42313, "r_y1": 554.03958, "r_x2": 388.42313, "r_y2": 551.32286, "r_x3": 183.2438, "r_y3": 551.32286, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 180.12473, "t": 555.22173, "r": 191.86806, "b": 557.93845, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 557.93845, "r_x1": 191.86806, "r_y1": 557.93845, "r_x2": 191.86806, "r_y2": 555.22173, "r_x3": 180.12473, "r_y3": 555.22173, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 407.38348, "t": 518.30042, "r": 408.82025, "b": 521.01712, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 521.01712, "r_x1": 408.82025, "r_y1": 521.01712, "r_x2": 408.82025, "r_y2": 518.30042, "r_x3": 407.38348, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 410.25699, "t": 518.30042, "r": 450.48605, "b": 521.01712, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 521.01712, "r_x1": 450.48605, "r_y1": 521.01712, "r_x2": 450.48605, "r_y2": 518.30042, "r_x3": 410.25699, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 407.38348, "t": 522.19925, "r": 408.82025, "b": 524.9159500000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 524.9159500000001, "r_x1": 408.82025, "r_y1": 524.9159500000001, "r_x2": 408.82025, "r_y2": 522.19925, "r_x3": 407.38348, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 410.25699, "t": 522.19925, "r": 450.48605, "b": 524.9159500000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 524.9159500000001, "r_x1": 450.48605, "r_y1": 524.9159500000001, "r_x2": 450.48605, "r_y2": 522.19925, "r_x3": 410.25699, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 407.38348, "t": 526.09808, "r": 408.82025, "b": 528.81479, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 528.81479, "r_x1": 408.82025, "r_y1": 528.81479, "r_x2": 408.82025, "r_y2": 526.09808, "r_x3": 407.38348, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 410.25699, "t": 526.09808, "r": 450.48605, "b": 528.81479, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 528.81479, "r_x1": 450.48605, "r_y1": 528.81479, "r_x2": 450.48605, "r_y2": 526.09808, "r_x3": 410.25699, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 407.38348, "t": 529.99695, "r": 408.82025, "b": 532.7136499999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 532.7136499999999, "r_x1": 408.82025, "r_y1": 532.7136499999999, "r_x2": 408.82025, "r_y2": 529.99695, "r_x3": 407.38348, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 410.25699, "t": 529.99695, "r": 450.48605, "b": 532.7136499999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 532.7136499999999, "r_x1": 450.48605, "r_y1": 532.7136499999999, "r_x2": 450.48605, "r_y2": 529.99695, "r_x3": 410.25699, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 407.38348, "t": 533.8957800000001, "r": 408.82025, "b": 536.6125, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 536.6125, "r_x1": 408.82025, "r_y1": 536.6125, "r_x2": 408.82025, "r_y2": 533.8957800000001, "r_x3": 407.38348, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 410.25699, "t": 533.8957800000001, "r": 450.48605, "b": 536.6125, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 536.6125, "r_x1": 450.48605, "r_y1": 536.6125, "r_x2": 450.48605, "r_y2": 533.8957800000001, "r_x3": 410.25699, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 407.38348, "t": 537.79463, "r": 408.82025, "b": 540.51135, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 540.51135, "r_x1": 408.82025, "r_y1": 540.51135, "r_x2": 408.82025, "r_y2": 537.79463, "r_x3": 407.38348, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 410.25699, "t": 537.79463, "r": 450.48605, "b": 540.51135, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 540.51135, "r_x1": 450.48605, "r_y1": 540.51135, "r_x2": 450.48605, "r_y2": 537.79463, "r_x3": 410.25699, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 407.38348, "t": 541.69348, "r": 408.82025, "b": 544.4102, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 544.4102, "r_x1": 408.82025, "r_y1": 544.4102, "r_x2": 408.82025, "r_y2": 541.69348, "r_x3": 407.38348, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 410.25699, "t": 541.69348, "r": 450.48605, "b": 544.4102, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 544.4102, "r_x1": 450.48605, "r_y1": 544.4102, "r_x2": 450.48605, "r_y2": 541.69348, "r_x3": 410.25699, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 407.38348, "t": 545.59233, "r": 408.82025, "b": 548.3090500000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 548.3090500000001, "r_x1": 408.82025, "r_y1": 548.3090500000001, "r_x2": 408.82025, "r_y2": 545.59233, "r_x3": 407.38348, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 410.25699, "t": 545.59233, "r": 450.48605, "b": 548.3090500000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 548.3090500000001, "r_x1": 450.48605, "r_y1": 548.3090500000001, "r_x2": 450.48605, "r_y2": 545.59233, "r_x3": 410.25699, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 407.38348, "t": 549.4911999999999, "r": 408.82025, "b": 552.2079200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 552.2079200000001, "r_x1": 408.82025, "r_y1": 552.2079200000001, "r_x2": 408.82025, "r_y2": 549.4911999999999, "r_x3": 407.38348, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 410.25699, "t": 549.4911999999999, "r": 450.48605, "b": 552.2079200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 552.2079200000001, "r_x1": 450.48605, "r_y1": 552.2079200000001, "r_x2": 450.48605, "r_y2": 549.4911999999999, "r_x3": 410.25699, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 164.52881, "t": 509.45859, "r": 181.8528, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.52881, "r_y0": 515.31, "r_x1": 181.8528, "r_y1": 515.31, "r_x2": 181.8528, "r_y2": 509.45859, "r_x3": 164.52881, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.58441, "t": 509.45859, "r": 186.3974, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58441, "r_y0": 515.31, "r_x1": 186.3974, "r_y1": 515.31, "r_x2": 186.3974, "r_y2": 509.45859, "r_x3": 183.58441, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 189.2104, "t": 509.45859, "r": 208.90137, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2104, "r_y0": 515.31, "r_x1": 208.90137, "r_y1": 515.31, "r_x2": 208.90137, "r_y2": 509.45859, "r_x3": 189.2104, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 210.63269, "t": 509.45859, "r": 221.04044, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63269, "r_y0": 515.31, "r_x1": 221.04044, "r_y1": 515.31, "r_x2": 221.04044, "r_y2": 509.45859, "r_x3": 210.63269, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 390.20203, "t": 509.60361, "r": 406.83609, "b": 515.45502, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.20203, "r_y0": 515.45502, "r_x1": 406.83609, "r_y1": 515.45502, "r_x2": 406.83609, "r_y2": 509.60361, "r_x3": 390.20203, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 408.56952, "t": 509.60361, "r": 411.38251, "b": 515.45502, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.56952, "r_y0": 515.45502, "r_x1": 411.38251, "r_y1": 515.45502, "r_x2": 411.38251, "r_y2": 509.60361, "r_x3": 408.56952, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 414.1955, "t": 509.60361, "r": 433.88647000000003, "b": 515.45502, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.1955, "r_y0": 515.45502, "r_x1": 433.88647000000003, "r_y1": 515.45502, "r_x2": 433.88647000000003, "r_y2": 509.60361, "r_x3": 414.1955, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 435.61737, "t": 509.60361, "r": 446.02512, "b": 515.45502, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61737, "r_y0": 515.45502, "r_x1": 446.02512, "r_y1": 515.45502, "r_x2": 446.02512, "r_y2": 509.60361, "r_x3": 435.61737, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 167.19316, "t": 519.07236, "r": 172.8231, "b": 526.3866, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19316, "r_y0": 526.3866, "r_x1": 172.8231, "r_y1": 526.3866, "r_x2": 172.8231, "r_y2": 519.07236, "r_x3": 167.19316, "r_y3": 519.07236, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 187.33745, "t": 448.62485, "r": 192.96739, "b": 455.93909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.33745, "r_y0": 455.93909, "r_x1": 192.96739, "r_y1": 455.93909, "r_x2": 192.96739, "r_y2": 448.62485, "r_x3": 187.33745, "r_y3": 448.62485, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 167.38654, "t": 566.0051599999999, "r": 173.01648, "b": 573.3194, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.38654, "r_y0": 573.3194, "r_x1": 173.01648, "r_y1": 573.3194, "r_x2": 173.01648, "r_y2": 566.0051599999999, "r_x3": 167.38654, "r_y3": 566.0051599999999, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 248.45621000000003, "t": 621.78008, "r": 253.65727, "b": 629.09431, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.45621000000003, "r_y0": 629.09431, "r_x1": 253.65727, "r_y1": 629.09431, "r_x2": 253.65727, "r_y2": 621.78008, "r_x3": 248.45621000000003, "r_y3": 621.78008, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 395.90057, "t": 519.19946, "r": 401.53052, "b": 526.5137, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.90057, "r_y0": 526.5137, "r_x1": 401.53052, "r_y1": 526.5137, "r_x2": 401.53052, "r_y2": 519.19946, "r_x3": 395.90057, "r_y3": 519.19946, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 171.62886, "t": 580.28853, "r": 177.48148, "b": 597.26784, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.62886, "r_y0": 597.26784, "r_x1": 177.48148, "r_y1": 597.26784, "r_x2": 177.48148, "r_y2": 580.28853, "r_x3": 171.62886, "r_y3": 580.28853, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 251.05969000000002, "t": 633.63408, "r": 256.91235, "b": 649.92345, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.05969000000002, "r_y0": 649.92345, "r_x1": 256.91235, "r_y1": 649.92345, "r_x2": 256.91235, "r_y2": 633.63408, "r_x3": 251.05969000000002, "r_y3": 633.63408, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 372.14645, "t": 601.45724, "r": 427.0379, "b": 607.30864, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 607.30864, "r_x1": 427.0379, "r_y1": 607.30864, "r_x2": 427.0379, "r_y2": 601.45724, "r_x3": 372.14645, "r_y3": 601.45724, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 372.14645, "t": 607.89948, "r": 430.06838999999997, "b": 613.75087, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 613.75087, "r_x1": 430.06838999999997, "r_y1": 613.75087, "r_x2": 430.06838999999997, "r_y2": 607.89948, "r_x3": 372.14645, "r_y3": 607.89948, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 176.88042, "t": 642.87209, "r": 231.08191, "b": 648.72348, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 648.72348, "r_x1": 231.08191, "r_y1": 648.72348, "r_x2": 231.08191, "r_y2": 642.87209, "r_x3": 176.88042, "r_y3": 642.87209, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 176.88042, "t": 649.3143, "r": 230.99271000000002, "b": 655.1657, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 655.1657, "r_x1": 230.99271000000002, "r_y1": 655.1657, "r_x2": 230.99271000000002, "r_y2": 649.3143, "r_x3": 176.88042, "r_y3": 649.3143, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 176.88042, "t": 655.7565500000001, "r": 203.93219, "b": 661.60794, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 661.60794, "r_x1": 203.93219, "r_y1": 661.60794, "r_x2": 203.93219, "r_y2": 655.7565500000001, "r_x3": 176.88042, "r_y3": 655.7565500000001, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 215.93231000000003, "t": 557.56342, "r": 218.4697, "b": 569.15967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93231000000003, "r_y0": 569.15967, "r_x1": 218.4697, "r_y1": 569.15967, "r_x2": 218.4697, "r_y2": 557.56342, "r_x3": 215.93231000000003, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 229.05689999999998, "t": 557.56342, "r": 231.71908999999997, "b": 569.15967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.05689999999998, "r_y0": 569.15967, "r_x1": 231.71908999999997, "r_y1": 569.15967, "r_x2": 231.71908999999997, "r_y2": 557.56342, "r_x3": 229.05689999999998, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 261.20892, "t": 448.46124, "r": 263.56973, "b": 451.19727, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.20892, "r_y0": 451.19727, "r_x1": 263.56973, "r_y1": 451.19727, "r_x2": 263.56973, "r_y2": 448.46124, "r_x3": 261.20892, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 312.33463, "t": 448.46124, "r": 313.6362, "b": 451.19727, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33463, "r_y0": 451.19727, "r_x1": 313.6362, "r_y1": 451.19727, "r_x2": 313.6362, "r_y2": 448.46124, "r_x3": 312.33463, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 377.41125, "t": 448.46124, "r": 380.05737, "b": 451.19727, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41125, "r_y0": 451.19727, "r_x1": 380.05737, "r_y1": 451.19727, "r_x2": 380.05737, "r_y2": 448.46124, "r_x3": 377.41125, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 200.63976, "t": 453.33997, "r": 205.82492, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63976, "r_y0": 456.07599, "r_x1": 205.82492, "r_y1": 456.07599, "r_x2": 205.82492, "r_y2": 453.33997, "r_x3": 200.63976, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 222.20833000000002, "t": 453.33997, "r": 229.76836, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.20833000000002, "r_y0": 456.07599, "r_x1": 229.76836, "r_y1": 456.07599, "r_x2": 229.76836, "r_y2": 453.33997, "r_x3": 222.20833000000002, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 243.26666, "t": 453.33997, "r": 250.82669, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26666, "r_y0": 456.07599, "r_x1": 250.82669, "r_y1": 456.07599, "r_x2": 250.82669, "r_y2": 453.33997, "r_x3": 243.26666, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 264.29657, "t": 453.33997, "r": 271.84949, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29657, "r_y0": 456.07599, "r_x1": 271.84949, "r_y1": 456.07599, "r_x2": 271.84949, "r_y2": 453.33997, "r_x3": 264.29657, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 285.31943, "t": 453.33997, "r": 292.87946, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.31943, "r_y0": 456.07599, "r_x1": 292.87946, "r_y1": 456.07599, "r_x2": 292.87946, "r_y2": 453.33997, "r_x3": 285.31943, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 306.37775, "t": 453.33997, "r": 311.77319, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37775, "r_y0": 456.07599, "r_x1": 311.77319, "r_y1": 456.07599, "r_x2": 311.77319, "r_y2": 453.33997, "r_x3": 306.37775, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 323.41699, "t": 453.33997, "r": 325.58157, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.41699, "r_y0": 456.07599, "r_x1": 325.58157, "r_y1": 456.07599, "r_x2": 325.58157, "r_y2": 453.33997, "r_x3": 323.41699, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 334.45807, "t": 453.33997, "r": 336.62265, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.45807, "r_y0": 456.07599, "r_x1": 336.62265, "r_y1": 456.07599, "r_x2": 336.62265, "r_y2": 453.33997, "r_x3": 334.45807, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 345.52756, "t": 453.33997, "r": 347.69214, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52756, "r_y0": 456.07599, "r_x1": 347.69214, "r_y1": 456.07599, "r_x2": 347.69214, "r_y2": 453.33997, "r_x3": 345.52756, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 356.56863, "t": 453.33997, "r": 358.73322, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56863, "r_y0": 456.07599, "r_x1": 358.73322, "r_y1": 456.07599, "r_x2": 358.73322, "r_y2": 453.33997, "r_x3": 356.56863, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 367.63812, "t": 453.33997, "r": 371.97089, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63812, "r_y0": 456.07599, "r_x1": 371.97089, "r_y1": 456.07599, "r_x2": 371.97089, "r_y2": 453.33997, "r_x3": 367.63812, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 382.6734, "t": 453.33997, "r": 387.00616, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.6734, "r_y0": 456.07599, "r_x1": 387.00616, "r_y1": 456.07599, "r_x2": 387.00616, "r_y2": 453.33997, "r_x3": 382.6734, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 397.73727, "t": 453.33997, "r": 402.07001, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73727, "r_y0": 456.07599, "r_x1": 402.07001, "r_y1": 456.07599, "r_x2": 402.07001, "r_y2": 453.33997, "r_x3": 397.73727, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 412.78879, "t": 447.99298, "r": 414.93463, "b": 457.79964999999993, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78879, "r_y0": 457.79964999999993, "r_x1": 414.93463, "r_y1": 457.79964999999993, "r_x2": 414.93463, "r_y2": 447.99298, "r_x3": 412.78879, "r_y3": 447.99298, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 414.95697, "t": 453.33997, "r": 422.51746, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.95697, "r_y0": 456.07599, "r_x1": 422.51746, "r_y1": 456.07599, "r_x2": 422.51746, "r_y2": 453.33997, "r_x3": 414.95697, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 200.63998, "t": 463.92444, "r": 204.57674, "b": 466.66043, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63998, "r_y0": 466.66043, "r_x1": 204.57674, "r_y1": 466.66043, "r_x2": 204.57674, "r_y2": 463.92444, "r_x3": 200.63998, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 367.62604, "t": 463.92444, "r": 369.58032, "b": 466.66043, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62604, "r_y0": 466.66043, "r_x1": 369.58032, "r_y1": 466.66043, "r_x2": 369.58032, "r_y2": 463.92444, "r_x3": 367.62604, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 382.66132, "t": 463.92444, "r": 384.6156, "b": 466.66043, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 466.66043, "r_x1": 384.6156, "r_y1": 466.66043, "r_x2": 384.6156, "r_y2": 463.92444, "r_x3": 382.66132, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 397.72504, "t": 463.92444, "r": 399.67932, "b": 466.66043, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72504, "r_y0": 466.66043, "r_x1": 399.67932, "r_y1": 466.66043, "r_x2": 399.67932, "r_y2": 463.92444, "r_x3": 397.72504, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 200.64, "t": 468.80313, "r": 206.51694, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.53915, "r_x1": 206.51694, "r_y1": 471.53915, "r_x2": 206.51694, "r_y2": 468.80313, "r_x3": 200.64, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 264.29047, "t": 468.80313, "r": 266.25885, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 471.53915, "r_x1": 266.25885, "r_y1": 471.53915, "r_x2": 266.25885, "r_y2": 468.80313, "r_x3": 264.29047, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 306.37213, "t": 468.80313, "r": 308.34052, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37213, "r_y0": 471.53915, "r_x1": 308.34052, "r_y1": 471.53915, "r_x2": 308.34052, "r_y2": 468.80313, "r_x3": 306.37213, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 345.51526, "t": 468.80313, "r": 347.48364, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.51526, "r_y0": 471.53915, "r_x1": 347.48364, "r_y1": 471.53915, "r_x2": 347.48364, "r_y2": 468.80313, "r_x3": 345.51526, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 356.55634, "t": 468.80313, "r": 358.52472, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.55634, "r_y0": 471.53915, "r_x1": 358.52472, "r_y1": 471.53915, "r_x2": 358.52472, "r_y2": 468.80313, "r_x3": 356.55634, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 367.62582, "t": 468.80313, "r": 369.59418, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62582, "r_y0": 471.53915, "r_x1": 369.59418, "r_y1": 471.53915, "r_x2": 369.59418, "r_y2": 468.80313, "r_x3": 367.62582, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 382.66107, "t": 468.80313, "r": 384.62946, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66107, "r_y0": 471.53915, "r_x1": 384.62946, "r_y1": 471.53915, "r_x2": 384.62946, "r_y2": 468.80313, "r_x3": 382.66107, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 200.64, "t": 473.68185, "r": 206.51694, "b": 476.41788, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.41788, "r_x1": 206.51694, "r_y1": 476.41788, "r_x2": 206.51694, "r_y2": 473.68185, "r_x3": 200.64, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 264.29047, "t": 473.68185, "r": 266.25885, "b": 476.41788, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 476.41788, "r_x1": 266.25885, "r_y1": 476.41788, "r_x2": 266.25885, "r_y2": 473.68185, "r_x3": 264.29047, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 200.64, "t": 478.53214, "r": 206.51694, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.26816, "r_x1": 206.51694, "r_y1": 481.26816, "r_x2": 206.51694, "r_y2": 478.53214, "r_x3": 200.64, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 243.26373, "t": 478.53214, "r": 245.2321, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26373, "r_y0": 481.26816, "r_x1": 245.2321, "r_y1": 481.26816, "r_x2": 245.2321, "r_y2": 478.53214, "r_x3": 243.26373, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 264.29047, "t": 478.53214, "r": 266.25885, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 481.26816, "r_x1": 266.25885, "r_y1": 481.26816, "r_x2": 266.25885, "r_y2": 478.53214, "r_x3": 264.29047, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 323.40466, "t": 478.53214, "r": 325.37305, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.40466, "r_y0": 481.26816, "r_x1": 325.37305, "r_y1": 481.26816, "r_x2": 325.37305, "r_y2": 478.53214, "r_x3": 323.40466, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 397.72519, "t": 478.53214, "r": 399.69354, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72519, "r_y0": 481.26816, "r_x1": 399.69354, "r_y1": 481.26816, "r_x2": 399.69354, "r_y2": 478.53214, "r_x3": 397.72519, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 200.64, "t": 483.41086, "r": 206.51694, "b": 486.14688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.14688, "r_x1": 206.51694, "r_y1": 486.14688, "r_x2": 206.51694, "r_y2": 483.41086, "r_x3": 200.64, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 382.66132, "t": 483.41086, "r": 384.61563, "b": 486.14688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 486.14688, "r_x1": 384.61563, "r_y1": 486.14688, "r_x2": 384.61563, "r_y2": 483.41086, "r_x3": 382.66132, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 397.72513, "t": 483.41086, "r": 401.64819, "b": 486.14688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72513, "r_y0": 486.14688, "r_x1": 401.64819, "r_y1": 486.14688, "r_x2": 401.64819, "r_y2": 483.41086, "r_x3": 397.72513, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 412.78928, "t": 483.41086, "r": 414.74359, "b": 486.14688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78928, "r_y0": 486.14688, "r_x1": 414.74359, "r_y1": 486.14688, "r_x2": 414.74359, "r_y2": 483.41086, "r_x3": 412.78928, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 200.64014, "t": 488.28958, "r": 207.14445, "b": 491.0256, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64014, "r_y0": 491.0256, "r_x1": 207.14445, "r_y1": 491.0256, "r_x2": 207.14445, "r_y2": 488.28958, "r_x3": 200.64014, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 367.62616, "t": 488.28958, "r": 369.78375, "b": 491.0256, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62616, "r_y0": 491.0256, "r_x1": 369.78375, "r_y1": 491.0256, "r_x2": 369.78375, "r_y2": 488.28958, "r_x3": 367.62616, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 382.66141, "t": 488.28958, "r": 384.81897, "b": 491.0256, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66141, "r_y0": 491.0256, "r_x1": 384.81897, "r_y1": 491.0256, "r_x2": 384.81897, "r_y2": 488.28958, "r_x3": 382.66141, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 397.7251, "t": 488.28958, "r": 402.05087, "b": 491.0256, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7251, "r_y0": 491.0256, "r_x1": 402.05087, "r_y1": 491.0256, "r_x2": 402.05087, "r_y2": 488.28958, "r_x3": 397.7251, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 200.64032, "t": 493.1683, "r": 208.48566, "b": 495.90433, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64032, "r_y0": 495.90433, "r_x1": 208.48566, "r_y1": 495.90433, "r_x2": 208.48566, "r_y2": 493.1683, "r_x3": 200.64032, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 264.29044, "t": 493.1683, "r": 266.25879, "b": 495.90433, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29044, "r_y0": 495.90433, "r_x1": 266.25879, "r_y1": 495.90433, "r_x2": 266.25879, "r_y2": 493.1683, "r_x3": 264.29044, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 155, "page_no": 9, "cluster": { "id": 155, "label": "text", "bbox": { "l": 227.91466, "t": 665.82603, "r": 230.10028, "b": 675.3464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.91466, "r_y0": 675.3464, "r_x1": 230.10028, "r_y1": 675.3464, "r_x2": 230.10028, "r_y2": 665.82603, "r_x3": 227.91466, "r_y3": 665.82603, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u03bc" }, { "label": "text", "id": 156, "page_no": 9, "cluster": { "id": 156, "label": "text", "bbox": { "l": 300.58057, "t": 683.62195, "r": 302.72638, "b": 693.428658, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.58057, "r_y0": 693.428658, "r_x1": 302.72638, "r_y1": 693.428658, "r_x2": 302.72638, "r_y2": 683.62195, "r_x3": 300.58057, "r_y3": 683.62195, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u2265" } ], "body": [ { "label": "caption", "id": 4, "page_no": 9, "cluster": { "id": 4, "label": "caption", "bbox": { "l": 134.765, "t": 115.83618000000001, "r": 480.59357000000006, "b": 145.88666, "coord_origin": "TOPLEFT" }, "confidence": 0.9512290954589844, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 123.76251000000002, "r_x1": 173.09366, "r_y1": 123.76251000000002, "r_x2": 173.09366, "r_y2": 115.83618000000001, "r_x3": 134.765, "r_y3": 115.83618000000001, "coord_origin": "TOPLEFT" }, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.30299, "r_y0": 123.96868999999992, "r_x1": 480.59151999999995, "r_y1": 123.96868999999992, "r_x2": 480.59151999999995, "r_y2": 115.89899000000003, "r_x3": 181.30299, "r_y3": 115.89899000000003, "coord_origin": "TOPLEFT" }, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 134.92767000000003, "r_x1": 480.59357000000006, "r_y1": 134.92767000000003, "r_x2": 480.59357000000006, "r_y2": 126.85797000000014, "r_x3": 134.765, "r_y3": 126.85797000000014, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 145.88666, "r_x1": 305.95691, "r_y1": 145.88666, "r_x2": 305.95691, "r_y2": 137.81696, "r_x3": 134.765, "r_y3": 137.81696, "coord_origin": "TOPLEFT" }, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 2. TSR and cell detection results compared between OTSL and HTML on the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using TableFormer [9] (with enc=6, dec=6, heads=8)." }, { "label": "table", "id": 0, "page_no": 9, "cluster": { "id": 0, "label": "table", "bbox": { "l": 143.6376495361328, "t": 156.3477020263672, "r": 470.8485412597656, "b": 263.2624816894531, "coord_origin": "TOPLEFT" }, "confidence": 0.9884640574455261, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.782, "r_y0": 174.62865999999997, "r_x1": 194.99779, "r_y1": 174.62865999999997, "r_x2": 194.99779, "r_y2": 166.55895999999996, "r_x3": 160.782, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52499000000003, "r_y0": 174.6037, "r_x1": 254.04465, "r_y1": 174.6037, "r_x2": 254.04465, "r_y2": 166.534, "r_x3": 215.52499000000003, "r_y3": 166.534, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.397, "r_y0": 169.14868, "r_x1": 323.99118, "r_y1": 169.14868, "r_x2": 323.99118, "r_y2": 161.07898, "r_x3": 300.397, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.345, "r_y0": 174.62865999999997, "r_x1": 414.74661, "r_y1": 174.62865999999997, "r_x2": 414.74661, "r_y2": 166.55895999999996, "r_x3": 370.345, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.737, "r_y0": 169.14868, "r_x1": 463.10830999999996, "r_y1": 169.14868, "r_x2": 463.10830999999996, "r_y2": 161.07898, "r_x3": 426.737, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11401, "r_y0": 180.10766999999998, "r_x1": 466.72656, "r_y1": 180.10766999999998, "r_x2": 466.72656, "r_y2": 172.03796, "r_x3": 423.11401, "r_y3": 172.03796, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41299, "r_y0": 182.10071000000005, "r_x1": 288.0596, "r_y1": 182.10071000000005, "r_x2": 288.0596, "r_y2": 174.03101000000004, "r_x3": 262.41299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.42899, "r_y0": 182.10071000000005, "r_x1": 329.44687, "r_y1": 182.10071000000005, "r_x2": 329.44687, "r_y2": 174.03101000000004, "r_x3": 296.42899, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03299, "r_y0": 182.10071000000005, "r_x1": 354.75793, "r_y1": 182.10071000000005, "r_x2": 354.75793, "r_y2": 174.03101000000004, "r_x3": 345.03299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.53799, "r_y0": 200.92969000000005, "r_x1": 201.24129, "r_y1": 200.92969000000005, "r_x2": 201.24129, "r_y2": 192.85999000000004, "r_x3": 154.53799, "r_y3": 192.85999000000004, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 195.45068000000003, "r_x1": 247.13226000000003, "r_y1": 195.45068000000003, "r_x2": 247.13226000000003, "r_y2": 187.38098000000002, "r_x3": 222.43700000000004, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 195.45068000000003, "r_x1": 285.73074, "r_y1": 195.45068000000003, "r_x2": 285.73074, "r_y2": 187.38098000000002, "r_x3": 264.74399, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 195.45068000000003, "r_x1": 323.43076, "r_y1": 195.45068000000003, "r_x2": 323.43076, "r_y2": 187.38098000000002, "r_x3": 302.444, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 195.45068000000003, "r_x1": 360.38977, "r_y1": 195.45068000000003, "r_x2": 360.38977, "r_y2": 187.38098000000002, "r_x3": 339.40302, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.116, "r_y0": 195.24451, "r_x1": 401.97324, "r_y1": 195.24451, "r_x2": 401.97324, "r_y2": 187.31817999999998, "r_x3": 383.116, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 195.24451, "r_x1": 454.35025, "r_y1": 195.24451, "r_x2": 454.35025, "r_y2": 187.31817999999998, "r_x3": 435.49300999999997, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 208.40166999999997, "r_x1": 248.66655999999998, "r_y1": 208.40166999999997, "r_x2": 248.66655999999998, "r_y2": 200.33196999999996, "r_x3": 220.903, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 208.40166999999997, "r_x1": 285.73074, "r_y1": 208.40166999999997, "r_x2": 285.73074, "r_y2": 200.33196999999996, "r_x3": 264.74399, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 208.40166999999997, "r_x1": 323.43076, "r_y1": 208.40166999999997, "r_x2": 323.43076, "r_y2": 200.33196999999996, "r_x3": 302.444, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 208.40166999999997, "r_x1": 360.38977, "r_y1": 208.40166999999997, "r_x2": 360.38977, "r_y2": 200.33196999999996, "r_x3": 339.40302, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 208.40166999999997, "r_x1": 403.03876, "r_y1": 208.40166999999997, "r_x2": 403.03876, "r_y2": 200.33196999999996, "r_x3": 382.052, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 208.40166999999997, "r_x1": 453.11182, "r_y1": 208.40166999999997, "r_x2": 453.11182, "r_y2": 200.33196999999996, "r_x3": 436.73199000000005, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.94501, "r_y0": 227.23168999999996, "r_x1": 199.83374, "r_y1": 227.23168999999996, "r_x2": 199.83374, "r_y2": 219.16198999999995, "r_x3": 155.94501, "r_y3": 219.16198999999995, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 221.75171, "r_x1": 247.13226000000003, "r_y1": 221.75171, "r_x2": 247.13226000000003, "r_y2": 213.68201, "r_x3": 222.43700000000004, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 221.75171, "r_x1": 285.73074, "r_y1": 221.75171, "r_x2": 285.73074, "r_y2": 213.68201, "r_x3": 264.74399, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 221.75171, "r_x1": 323.43076, "r_y1": 221.75171, "r_x2": 323.43076, "r_y2": 213.68201, "r_x3": 302.444, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 221.54552999999999, "r_x1": 361.97586, "r_y1": 221.54552999999999, "r_x2": 361.97586, "r_y2": 213.61919999999998, "r_x3": 337.815, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 221.54552999999999, "r_x1": 404.62485, "r_y1": 221.54552999999999, "r_x2": 404.62485, "r_y2": 213.61919999999998, "r_x3": 380.46399, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 221.54552999999999, "r_x1": 454.35025, "r_y1": 221.54552999999999, "r_x2": 454.35025, "r_y2": 213.61919999999998, "r_x3": 435.49300999999997, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 234.70367, "r_x1": 248.66655999999998, "r_y1": 234.70367, "r_x2": 248.66655999999998, "r_y2": 226.63396999999998, "r_x3": 220.903, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 234.70367, "r_x1": 285.73074, "r_y1": 234.70367, "r_x2": 285.73074, "r_y2": 226.63396999999998, "r_x3": 264.74399, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 234.70367, "r_x1": 323.43076, "r_y1": 234.70367, "r_x2": 323.43076, "r_y2": 226.63396999999998, "r_x3": 302.444, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.70599, "r_y0": 234.70367, "r_x1": 358.08582, "r_y1": 234.70367, "r_x2": 358.08582, "r_y2": 226.63396999999998, "r_x3": 341.70599, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 234.70367, "r_x1": 403.03876, "r_y1": 234.70367, "r_x2": 403.03876, "r_y2": 226.63396999999998, "r_x3": 382.052, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 234.70367, "r_x1": 453.11182, "r_y1": 234.70367, "r_x2": 453.11182, "r_y2": 226.63396999999998, "r_x3": 436.73199000000005, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.62601, "r_y0": 253.53265, "r_x1": 207.1524, "r_y1": 253.53265, "r_x2": 207.1524, "r_y2": 245.46294999999998, "r_x3": 148.62601, "r_y3": 245.46294999999998, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 248.05267000000003, "r_x1": 247.13226000000003, "r_y1": 248.05267000000003, "r_x2": 247.13226000000003, "r_y2": 239.98297000000002, "r_x3": 222.43700000000004, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 248.05267000000003, "r_x1": 285.73074, "r_y1": 248.05267000000003, "r_x2": 285.73074, "r_y2": 239.98297000000002, "r_x3": 264.74399, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 248.05267000000003, "r_x1": 323.43076, "r_y1": 248.05267000000003, "r_x2": 323.43076, "r_y2": 239.98297000000002, "r_x3": 302.444, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 247.8465, "r_x1": 361.97586, "r_y1": 247.8465, "r_x2": 361.97586, "r_y2": 239.92016999999998, "r_x3": 337.815, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 247.8465, "r_x1": 404.62485, "r_y1": 247.8465, "r_x2": 404.62485, "r_y2": 239.92016999999998, "r_x3": 380.46399, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 247.8465, "r_x1": 454.35025, "r_y1": 247.8465, "r_x2": 454.35025, "r_y2": 239.92016999999998, "r_x3": 435.49300999999997, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 261.00469999999996, "r_x1": 248.66655999999998, "r_y1": 261.00469999999996, "r_x2": 248.66655999999998, "r_y2": 252.93499999999995, "r_x3": 220.903, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 261.00469999999996, "r_x1": 285.73074, "r_y1": 261.00469999999996, "r_x2": 285.73074, "r_y2": 252.93499999999995, "r_x3": 264.74399, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 261.00469999999996, "r_x1": 323.43076, "r_y1": 261.00469999999996, "r_x2": 323.43076, "r_y2": 252.93499999999995, "r_x3": 302.444, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 261.00469999999996, "r_x1": 360.38977, "r_y1": 261.00469999999996, "r_x2": 360.38977, "r_y2": 252.93499999999995, "r_x3": 339.40302, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 261.00469999999996, "r_x1": 403.03876, "r_y1": 261.00469999999996, "r_x2": 403.03876, "r_y2": 252.93499999999995, "r_x3": 382.052, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 261.00469999999996, "r_x1": 453.11182, "r_y1": 261.00469999999996, "r_x2": 453.11182, "r_y2": 252.93499999999995, "r_x3": 436.73199000000005, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 10, "label": "text", "bbox": { "l": 160.782, "t": 166.55895999999996, "r": 194.99779, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.782, "r_y0": 174.62865999999997, "r_x1": 194.99779, "r_y1": 174.62865999999997, "r_x2": 194.99779, "r_y2": 166.55895999999996, "r_x3": 160.782, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 215.52499000000003, "t": 166.534, "r": 254.04465, "b": 174.6037, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52499000000003, "r_y0": 174.6037, "r_x1": 254.04465, "r_y1": 174.6037, "r_x2": 254.04465, "r_y2": 166.534, "r_x3": 215.52499000000003, "r_y3": 166.534, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 300.397, "t": 161.07898, "r": 323.99118, "b": 169.14868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.397, "r_y0": 169.14868, "r_x1": 323.99118, "r_y1": 169.14868, "r_x2": 323.99118, "r_y2": 161.07898, "r_x3": 300.397, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 370.345, "t": 166.55895999999996, "r": 414.74661, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.345, "r_y0": 174.62865999999997, "r_x1": 414.74661, "r_y1": 174.62865999999997, "r_x2": 414.74661, "r_y2": 166.55895999999996, "r_x3": 370.345, "r_y3": 166.55895999999996, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 426.737, "t": 161.07898, "r": 463.10830999999996, "b": 169.14868, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.737, "r_y0": 169.14868, "r_x1": 463.10830999999996, "r_y1": 169.14868, "r_x2": 463.10830999999996, "r_y2": 161.07898, "r_x3": 426.737, "r_y3": 161.07898, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 423.11401, "t": 172.03796, "r": 466.72656, "b": 180.10766999999998, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11401, "r_y0": 180.10766999999998, "r_x1": 466.72656, "r_y1": 180.10766999999998, "r_x2": 466.72656, "r_y2": 172.03796, "r_x3": 423.11401, "r_y3": 172.03796, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 262.41299, "t": 174.03101000000004, "r": 288.0596, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41299, "r_y0": 182.10071000000005, "r_x1": 288.0596, "r_y1": 182.10071000000005, "r_x2": 288.0596, "r_y2": 174.03101000000004, "r_x3": 262.41299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 296.42899, "t": 174.03101000000004, "r": 329.44687, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.42899, "r_y0": 182.10071000000005, "r_x1": 329.44687, "r_y1": 182.10071000000005, "r_x2": 329.44687, "r_y2": 174.03101000000004, "r_x3": 296.42899, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 345.03299, "t": 174.03101000000004, "r": 354.75793, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03299, "r_y0": 182.10071000000005, "r_x1": 354.75793, "r_y1": 182.10071000000005, "r_x2": 354.75793, "r_y2": 174.03101000000004, "r_x3": 345.03299, "r_y3": 174.03101000000004, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 154.53799, "t": 192.85999000000004, "r": 201.24129, "b": 200.92969000000005, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.53799, "r_y0": 200.92969000000005, "r_x1": 201.24129, "r_y1": 200.92969000000005, "r_x2": 201.24129, "r_y2": 192.85999000000004, "r_x3": 154.53799, "r_y3": 192.85999000000004, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 222.43700000000004, "t": 187.38098000000002, "r": 247.13226000000003, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 195.45068000000003, "r_x1": 247.13226000000003, "r_y1": 195.45068000000003, "r_x2": 247.13226000000003, "r_y2": 187.38098000000002, "r_x3": 222.43700000000004, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 264.74399, "t": 187.38098000000002, "r": 285.73074, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 195.45068000000003, "r_x1": 285.73074, "r_y1": 195.45068000000003, "r_x2": 285.73074, "r_y2": 187.38098000000002, "r_x3": 264.74399, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 302.444, "t": 187.38098000000002, "r": 323.43076, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 195.45068000000003, "r_x1": 323.43076, "r_y1": 195.45068000000003, "r_x2": 323.43076, "r_y2": 187.38098000000002, "r_x3": 302.444, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 339.40302, "t": 187.38098000000002, "r": 360.38977, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 195.45068000000003, "r_x1": 360.38977, "r_y1": 195.45068000000003, "r_x2": 360.38977, "r_y2": 187.38098000000002, "r_x3": 339.40302, "r_y3": 187.38098000000002, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 383.116, "t": 187.31817999999998, "r": 401.97324, "b": 195.24451, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.116, "r_y0": 195.24451, "r_x1": 401.97324, "r_y1": 195.24451, "r_x2": 401.97324, "r_y2": 187.31817999999998, "r_x3": 383.116, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 435.49300999999997, "t": 187.31817999999998, "r": 454.35025, "b": 195.24451, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 195.24451, "r_x1": 454.35025, "r_y1": 195.24451, "r_x2": 454.35025, "r_y2": 187.31817999999998, "r_x3": 435.49300999999997, "r_y3": 187.31817999999998, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 220.903, "t": 200.33196999999996, "r": 248.66655999999998, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 208.40166999999997, "r_x1": 248.66655999999998, "r_y1": 208.40166999999997, "r_x2": 248.66655999999998, "r_y2": 200.33196999999996, "r_x3": 220.903, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 264.74399, "t": 200.33196999999996, "r": 285.73074, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 208.40166999999997, "r_x1": 285.73074, "r_y1": 208.40166999999997, "r_x2": 285.73074, "r_y2": 200.33196999999996, "r_x3": 264.74399, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 302.444, "t": 200.33196999999996, "r": 323.43076, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 208.40166999999997, "r_x1": 323.43076, "r_y1": 208.40166999999997, "r_x2": 323.43076, "r_y2": 200.33196999999996, "r_x3": 302.444, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 339.40302, "t": 200.33196999999996, "r": 360.38977, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 208.40166999999997, "r_x1": 360.38977, "r_y1": 208.40166999999997, "r_x2": 360.38977, "r_y2": 200.33196999999996, "r_x3": 339.40302, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 382.052, "t": 200.33196999999996, "r": 403.03876, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 208.40166999999997, "r_x1": 403.03876, "r_y1": 208.40166999999997, "r_x2": 403.03876, "r_y2": 200.33196999999996, "r_x3": 382.052, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 436.73199000000005, "t": 200.33196999999996, "r": 453.11182, "b": 208.40166999999997, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 208.40166999999997, "r_x1": 453.11182, "r_y1": 208.40166999999997, "r_x2": 453.11182, "r_y2": 200.33196999999996, "r_x3": 436.73199000000005, "r_y3": 200.33196999999996, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 155.94501, "t": 219.16198999999995, "r": 199.83374, "b": 227.23168999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.94501, "r_y0": 227.23168999999996, "r_x1": 199.83374, "r_y1": 227.23168999999996, "r_x2": 199.83374, "r_y2": 219.16198999999995, "r_x3": 155.94501, "r_y3": 219.16198999999995, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 222.43700000000004, "t": 213.68201, "r": 247.13226000000003, "b": 221.75171, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 221.75171, "r_x1": 247.13226000000003, "r_y1": 221.75171, "r_x2": 247.13226000000003, "r_y2": 213.68201, "r_x3": 222.43700000000004, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 264.74399, "t": 213.68201, "r": 285.73074, "b": 221.75171, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 221.75171, "r_x1": 285.73074, "r_y1": 221.75171, "r_x2": 285.73074, "r_y2": 213.68201, "r_x3": 264.74399, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 302.444, "t": 213.68201, "r": 323.43076, "b": 221.75171, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 221.75171, "r_x1": 323.43076, "r_y1": 221.75171, "r_x2": 323.43076, "r_y2": 213.68201, "r_x3": 302.444, "r_y3": 213.68201, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 337.815, "t": 213.61919999999998, "r": 361.97586, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 221.54552999999999, "r_x1": 361.97586, "r_y1": 221.54552999999999, "r_x2": 361.97586, "r_y2": 213.61919999999998, "r_x3": 337.815, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 380.46399, "t": 213.61919999999998, "r": 404.62485, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 221.54552999999999, "r_x1": 404.62485, "r_y1": 221.54552999999999, "r_x2": 404.62485, "r_y2": 213.61919999999998, "r_x3": 380.46399, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 435.49300999999997, "t": 213.61919999999998, "r": 454.35025, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 221.54552999999999, "r_x1": 454.35025, "r_y1": 221.54552999999999, "r_x2": 454.35025, "r_y2": 213.61919999999998, "r_x3": 435.49300999999997, "r_y3": 213.61919999999998, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 220.903, "t": 226.63396999999998, "r": 248.66655999999998, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 234.70367, "r_x1": 248.66655999999998, "r_y1": 234.70367, "r_x2": 248.66655999999998, "r_y2": 226.63396999999998, "r_x3": 220.903, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 264.74399, "t": 226.63396999999998, "r": 285.73074, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 234.70367, "r_x1": 285.73074, "r_y1": 234.70367, "r_x2": 285.73074, "r_y2": 226.63396999999998, "r_x3": 264.74399, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 302.444, "t": 226.63396999999998, "r": 323.43076, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 234.70367, "r_x1": 323.43076, "r_y1": 234.70367, "r_x2": 323.43076, "r_y2": 226.63396999999998, "r_x3": 302.444, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 341.70599, "t": 226.63396999999998, "r": 358.08582, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.70599, "r_y0": 234.70367, "r_x1": 358.08582, "r_y1": 234.70367, "r_x2": 358.08582, "r_y2": 226.63396999999998, "r_x3": 341.70599, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 382.052, "t": 226.63396999999998, "r": 403.03876, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 234.70367, "r_x1": 403.03876, "r_y1": 234.70367, "r_x2": 403.03876, "r_y2": 226.63396999999998, "r_x3": 382.052, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 436.73199000000005, "t": 226.63396999999998, "r": 453.11182, "b": 234.70367, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 234.70367, "r_x1": 453.11182, "r_y1": 234.70367, "r_x2": 453.11182, "r_y2": 226.63396999999998, "r_x3": 436.73199000000005, "r_y3": 226.63396999999998, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 148.62601, "t": 245.46294999999998, "r": 207.1524, "b": 253.53265, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.62601, "r_y0": 253.53265, "r_x1": 207.1524, "r_y1": 253.53265, "r_x2": 207.1524, "r_y2": 245.46294999999998, "r_x3": 148.62601, "r_y3": 245.46294999999998, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 222.43700000000004, "t": 239.98297000000002, "r": 247.13226000000003, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.43700000000004, "r_y0": 248.05267000000003, "r_x1": 247.13226000000003, "r_y1": 248.05267000000003, "r_x2": 247.13226000000003, "r_y2": 239.98297000000002, "r_x3": 222.43700000000004, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 264.74399, "t": 239.98297000000002, "r": 285.73074, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 248.05267000000003, "r_x1": 285.73074, "r_y1": 248.05267000000003, "r_x2": 285.73074, "r_y2": 239.98297000000002, "r_x3": 264.74399, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 302.444, "t": 239.98297000000002, "r": 323.43076, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 248.05267000000003, "r_x1": 323.43076, "r_y1": 248.05267000000003, "r_x2": 323.43076, "r_y2": 239.98297000000002, "r_x3": 302.444, "r_y3": 239.98297000000002, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 337.815, "t": 239.92016999999998, "r": 361.97586, "b": 247.8465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.815, "r_y0": 247.8465, "r_x1": 361.97586, "r_y1": 247.8465, "r_x2": 361.97586, "r_y2": 239.92016999999998, "r_x3": 337.815, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 380.46399, "t": 239.92016999999998, "r": 404.62485, "b": 247.8465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46399, "r_y0": 247.8465, "r_x1": 404.62485, "r_y1": 247.8465, "r_x2": 404.62485, "r_y2": 239.92016999999998, "r_x3": 380.46399, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 435.49300999999997, "t": 239.92016999999998, "r": 454.35025, "b": 247.8465, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49300999999997, "r_y0": 247.8465, "r_x1": 454.35025, "r_y1": 247.8465, "r_x2": 454.35025, "r_y2": 239.92016999999998, "r_x3": 435.49300999999997, "r_y3": 239.92016999999998, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 220.903, "t": 252.93499999999995, "r": 248.66655999999998, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.903, "r_y0": 261.00469999999996, "r_x1": 248.66655999999998, "r_y1": 261.00469999999996, "r_x2": 248.66655999999998, "r_y2": 252.93499999999995, "r_x3": 220.903, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 264.74399, "t": 252.93499999999995, "r": 285.73074, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74399, "r_y0": 261.00469999999996, "r_x1": 285.73074, "r_y1": 261.00469999999996, "r_x2": 285.73074, "r_y2": 252.93499999999995, "r_x3": 264.74399, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 302.444, "t": 252.93499999999995, "r": 323.43076, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.444, "r_y0": 261.00469999999996, "r_x1": 323.43076, "r_y1": 261.00469999999996, "r_x2": 323.43076, "r_y2": 252.93499999999995, "r_x3": 302.444, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 339.40302, "t": 252.93499999999995, "r": 360.38977, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.40302, "r_y0": 261.00469999999996, "r_x1": 360.38977, "r_y1": 261.00469999999996, "r_x2": 360.38977, "r_y2": 252.93499999999995, "r_x3": 339.40302, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 382.052, "t": 252.93499999999995, "r": 403.03876, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.052, "r_y0": 261.00469999999996, "r_x1": 403.03876, "r_y1": 261.00469999999996, "r_x2": 403.03876, "r_y2": 252.93499999999995, "r_x3": 382.052, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 436.73199000000005, "t": 252.93499999999995, "r": 453.11182, "b": 261.00469999999996, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73199000000005, "r_y0": 261.00469999999996, "r_x1": 453.11182, "r_y1": 261.00469999999996, "r_x2": 453.11182, "r_y2": 252.93499999999995, "r_x3": 436.73199000000005, "r_y3": 252.93499999999995, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ched", "ched", "ched", "ucel", "ucel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 7, "table_cells": [ { "bbox": { "l": 160.782, "t": 166.55895999999996, "r": 194.99779, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Data set", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 215.52499000000003, "t": 166.534, "r": 254.04465, "b": 174.6037, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 300.397, "t": 161.07898, "r": 323.99118, "b": 169.14868, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 5, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 370.345, "t": 166.55895999999996, "r": 414.74661, "b": 174.62865999999997, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "mAP(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 426.737, "t": 161.07898, "r": 463.10830999999996, "b": 169.14868, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "Inference time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 262.41299, "t": 174.03101000000004, "r": 288.0596, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 296.42899, "t": 174.03101000000004, "r": 329.44687, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 345.03299, "t": 174.03101000000004, "r": 354.75793, "b": 182.10071000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 154.53799, "t": 192.85999000000004, "r": 201.24129, "b": 200.92969000000005, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.43700000000004, "t": 187.38098000000002, "r": 247.13226000000003, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74399, "t": 187.38098000000002, "r": 285.73074, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.444, "t": 187.38098000000002, "r": 323.43076, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 339.40302, "t": 187.38098000000002, "r": 360.38977, "b": 195.45068000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 383.116, "t": 187.31817999999998, "r": 401.97324, "b": 195.24451, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49300999999997, "t": 187.31817999999998, "r": 454.35025, "b": 195.24451, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 155.94501, "t": 219.16198999999995, "r": 199.83374, "b": 227.23168999999996, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.43700000000004, "t": 213.68201, "r": 247.13226000000003, "b": 221.75171, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74399, "t": 213.68201, "r": 285.73074, "b": 221.75171, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.955 0.917", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.444, "t": 213.68201, "r": 323.43076, "b": 221.75171, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.961 0.922", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.815, "t": 213.61919999999998, "r": 361.97586, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.959 0.92", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.46399, "t": 213.61919999999998, "r": 404.62485, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.862 0.722", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49300999999997, "t": 213.61919999999998, "r": 454.35025, "b": 221.54552999999999, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.85 3.26", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 148.62601, "t": 245.46294999999998, "r": 207.1524, "b": 253.53265, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTables-1M", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.43700000000004, "t": 239.98297000000002, "r": 247.13226000000003, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74399, "t": 239.98297000000002, "r": 285.73074, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.987 0.983", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.444, "t": 239.98297000000002, "r": 323.43076, "b": 248.05267000000003, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.964 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.815, "t": 239.92016999999998, "r": 361.97586, "b": 247.8465, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.977 0.966", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.46399, "t": 239.92016999999998, "r": 404.62485, "b": 247.8465, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.896 0.889", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49300999999997, "t": 239.92016999999998, "r": 454.35025, "b": 247.8465, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.79 3.26", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "section_header", "id": 3, "page_no": 9, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.765, "t": 288.91479, "r": 257.08679, "b": 297.72173999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9546447992324829, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 297.72173999999995, "r_x1": 149.40205, "r_y1": 297.72173999999995, "r_x2": 149.40205, "r_y2": 288.91479, "r_x3": 134.765, "r_y3": 288.91479, "coord_origin": "TOPLEFT" }, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.85904, "r_y0": 297.72173999999995, "r_x1": 257.08679, "r_y1": 297.72173999999995, "r_x2": 257.08679, "r_y2": 288.91479, "r_x3": 160.85904, "r_y3": 288.91479, "coord_origin": "TOPLEFT" }, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.3 Qualitative Results" }, { "label": "text", "id": 1, "page_no": 9, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 309.86078, "r": 480.58981, "b": 366.47769, "coord_origin": "TOPLEFT" }, "confidence": 0.9834085702896118, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 318.65775, "r_x1": 480.58777, "r_y1": 318.65775, "r_x2": 480.58777, "r_y2": 309.86078, "r_x3": 134.765, "r_y3": 309.86078, "coord_origin": "TOPLEFT" }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "orig": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 330.61273, "r_x1": 480.58889999999997, "r_y1": 330.61273, "r_x2": 480.58889999999997, "r_y2": 321.81577, "r_x3": 134.765, "r_y3": 321.81577, "coord_origin": "TOPLEFT" }, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 342.56772, "r_x1": 480.58681999999993, "r_y1": 342.56772, "r_x2": 480.58681999999993, "r_y2": 333.77075, "r_x3": 134.765, "r_y3": 333.77075, "coord_origin": "TOPLEFT" }, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 354.52271, "r_x1": 480.58981, "r_y1": 354.52271, "r_x2": 480.58981, "r_y2": 345.72574, "r_x3": 134.765, "r_y3": 345.72574, "coord_origin": "TOPLEFT" }, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 366.47769, "r_x1": 161.65704, "r_y1": 366.47769, "r_x2": 161.65704, "r_y2": 357.68073, "r_x3": 134.765, "r_y3": 357.68073, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5 demonstrates less overlap and more accurate bounding boxes with OTSL. In Figure 6, OTSL proves to be more effective in handling tables with longer token sequences, resulting in even more precise structure prediction and bounding boxes." }, { "label": "caption", "id": 5, "page_no": 9, "cluster": { "id": 5, "label": "caption", "bbox": { "l": 134.765, "t": 397.59012, "r": 480.59106, "b": 439.71716, "coord_origin": "TOPLEFT" }, "confidence": 0.9482728838920593, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 405.51642, "r_x1": 162.64424, "r_y1": 405.51642, "r_x2": 162.64424, "r_y2": 397.59012, "r_x3": 134.765, "r_y3": 397.59012, "coord_origin": "TOPLEFT" }, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.384, "r_y0": 405.72266, "r_x1": 480.59106, "r_y1": 405.72266, "r_x2": 480.59106, "r_y2": 397.65289, "r_x3": 167.384, "r_y3": 397.65289, "coord_origin": "TOPLEFT" }, "text": "The OTSL model produces more accurate bounding boxes with less over-", "orig": "The OTSL model produces more accurate bounding boxes with less over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 416.68167000000005, "r_x1": 480.59106, "r_y1": 416.68167000000005, "r_x2": 480.59106, "r_y2": 408.61190999999997, "r_x3": 134.765, "r_y3": 408.61190999999997, "coord_origin": "TOPLEFT" }, "text": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 427.64066, "r_x1": 480.58838000000003, "r_y1": 427.64066, "r_x2": 480.58838000000003, "r_y2": 419.57089, "r_x3": 134.765, "r_y3": 419.57089, "coord_origin": "TOPLEFT" }, "text": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "orig": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 438.59964, "r_x1": 304.69171, "r_y1": 438.59964, "r_x2": 304.69171, "r_y2": 430.52987999999993, "r_x3": 134.765, "r_y3": 430.52987999999993, "coord_origin": "TOPLEFT" }, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 342.63354, "r_y0": 439.71716, "r_x1": 344.81915, "r_y1": 439.71716, "r_x2": 344.81915, "r_y2": 430.19678, "r_x3": 342.63354, "r_y3": 430.19678, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 5. The OTSL model produces more accurate bounding boxes with less overlap (E) than the HTML model (D), when predicting the structure of a sparse table (A), at twice the inference speed because of shorter sequence length (B),(C). \"PMC2807444_006_00.png\" PubTabNet. \u03bc" }, { "label": "picture", "id": 2, "page_no": 9, "cluster": { "id": 2, "label": "picture", "bbox": { "l": 162.67430114746094, "t": 444.62255859375, "r": 451.70062255859375, "b": 663.2135620117188, "coord_origin": "TOPLEFT" }, "confidence": 0.9742383360862732, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 518.94992, "r_x1": 190.62042, "r_y1": 518.94992, "r_x2": 190.62042, "r_y2": 516.2332200000001, "r_x3": 180.12473, "r_y3": 516.2332200000001, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 522.84879, "r_x1": 304.54797, "r_y1": 522.84879, "r_x2": 304.54797, "r_y2": 520.13208, "r_x3": 183.2438, "r_y3": 520.13208, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 526.74765, "r_x1": 388.42313, "r_y1": 526.74765, "r_x2": 388.42313, "r_y2": 524.03094, "r_x3": 183.2438, "r_y3": 524.03094, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 530.64648, "r_x1": 388.42313, "r_y1": 530.64648, "r_x2": 388.42313, "r_y2": 527.9297799999999, "r_x3": 183.2438, "r_y3": 527.9297799999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 534.54532, "r_x1": 388.42313, "r_y1": 534.54532, "r_x2": 388.42313, "r_y2": 531.82861, "r_x3": 183.2438, "r_y3": 531.82861, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 538.44418, "r_x1": 388.42313, "r_y1": 538.44418, "r_x2": 388.42313, "r_y2": 535.72748, "r_x3": 183.2438, "r_y3": 535.72748, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 542.34303, "r_x1": 388.42313, "r_y1": 542.34303, "r_x2": 388.42313, "r_y2": 539.62631, "r_x3": 183.2438, "r_y3": 539.62631, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 546.24188, "r_x1": 388.42313, "r_y1": 546.24188, "r_x2": 388.42313, "r_y2": 543.52516, "r_x3": 183.2438, "r_y3": 543.52516, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 550.14073, "r_x1": 388.42313, "r_y1": 550.14073, "r_x2": 388.42313, "r_y2": 547.42401, "r_x3": 183.2438, "r_y3": 547.42401, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 554.03958, "r_x1": 388.42313, "r_y1": 554.03958, "r_x2": 388.42313, "r_y2": 551.32286, "r_x3": 183.2438, "r_y3": 551.32286, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 557.93845, "r_x1": 191.86806, "r_y1": 557.93845, "r_x2": 191.86806, "r_y2": 555.22173, "r_x3": 180.12473, "r_y3": 555.22173, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 521.01712, "r_x1": 408.82025, "r_y1": 521.01712, "r_x2": 408.82025, "r_y2": 518.30042, "r_x3": 407.38348, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 521.01712, "r_x1": 450.48605, "r_y1": 521.01712, "r_x2": 450.48605, "r_y2": 518.30042, "r_x3": 410.25699, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 524.9159500000001, "r_x1": 408.82025, "r_y1": 524.9159500000001, "r_x2": 408.82025, "r_y2": 522.19925, "r_x3": 407.38348, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 524.9159500000001, "r_x1": 450.48605, "r_y1": 524.9159500000001, "r_x2": 450.48605, "r_y2": 522.19925, "r_x3": 410.25699, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 528.81479, "r_x1": 408.82025, "r_y1": 528.81479, "r_x2": 408.82025, "r_y2": 526.09808, "r_x3": 407.38348, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 528.81479, "r_x1": 450.48605, "r_y1": 528.81479, "r_x2": 450.48605, "r_y2": 526.09808, "r_x3": 410.25699, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 532.7136499999999, "r_x1": 408.82025, "r_y1": 532.7136499999999, "r_x2": 408.82025, "r_y2": 529.99695, "r_x3": 407.38348, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 532.7136499999999, "r_x1": 450.48605, "r_y1": 532.7136499999999, "r_x2": 450.48605, "r_y2": 529.99695, "r_x3": 410.25699, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 536.6125, "r_x1": 408.82025, "r_y1": 536.6125, "r_x2": 408.82025, "r_y2": 533.8957800000001, "r_x3": 407.38348, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 536.6125, "r_x1": 450.48605, "r_y1": 536.6125, "r_x2": 450.48605, "r_y2": 533.8957800000001, "r_x3": 410.25699, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 540.51135, "r_x1": 408.82025, "r_y1": 540.51135, "r_x2": 408.82025, "r_y2": 537.79463, "r_x3": 407.38348, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 540.51135, "r_x1": 450.48605, "r_y1": 540.51135, "r_x2": 450.48605, "r_y2": 537.79463, "r_x3": 410.25699, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 544.4102, "r_x1": 408.82025, "r_y1": 544.4102, "r_x2": 408.82025, "r_y2": 541.69348, "r_x3": 407.38348, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 544.4102, "r_x1": 450.48605, "r_y1": 544.4102, "r_x2": 450.48605, "r_y2": 541.69348, "r_x3": 410.25699, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 548.3090500000001, "r_x1": 408.82025, "r_y1": 548.3090500000001, "r_x2": 408.82025, "r_y2": 545.59233, "r_x3": 407.38348, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 548.3090500000001, "r_x1": 450.48605, "r_y1": 548.3090500000001, "r_x2": 450.48605, "r_y2": 545.59233, "r_x3": 410.25699, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 552.2079200000001, "r_x1": 408.82025, "r_y1": 552.2079200000001, "r_x2": 408.82025, "r_y2": 549.4911999999999, "r_x3": 407.38348, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 552.2079200000001, "r_x1": 450.48605, "r_y1": 552.2079200000001, "r_x2": 450.48605, "r_y2": 549.4911999999999, "r_x3": 410.25699, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.52881, "r_y0": 515.31, "r_x1": 181.8528, "r_y1": 515.31, "r_x2": 181.8528, "r_y2": 509.45859, "r_x3": 164.52881, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58441, "r_y0": 515.31, "r_x1": 186.3974, "r_y1": 515.31, "r_x2": 186.3974, "r_y2": 509.45859, "r_x3": 183.58441, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2104, "r_y0": 515.31, "r_x1": 208.90137, "r_y1": 515.31, "r_x2": 208.90137, "r_y2": 509.45859, "r_x3": 189.2104, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63269, "r_y0": 515.31, "r_x1": 221.04044, "r_y1": 515.31, "r_x2": 221.04044, "r_y2": 509.45859, "r_x3": 210.63269, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.20203, "r_y0": 515.45502, "r_x1": 406.83609, "r_y1": 515.45502, "r_x2": 406.83609, "r_y2": 509.60361, "r_x3": 390.20203, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.56952, "r_y0": 515.45502, "r_x1": 411.38251, "r_y1": 515.45502, "r_x2": 411.38251, "r_y2": 509.60361, "r_x3": 408.56952, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.1955, "r_y0": 515.45502, "r_x1": 433.88647000000003, "r_y1": 515.45502, "r_x2": 433.88647000000003, "r_y2": 509.60361, "r_x3": 414.1955, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61737, "r_y0": 515.45502, "r_x1": 446.02512, "r_y1": 515.45502, "r_x2": 446.02512, "r_y2": 509.60361, "r_x3": 435.61737, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19316, "r_y0": 526.3866, "r_x1": 172.8231, "r_y1": 526.3866, "r_x2": 172.8231, "r_y2": 519.07236, "r_x3": 167.19316, "r_y3": 519.07236, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.33745, "r_y0": 455.93909, "r_x1": 192.96739, "r_y1": 455.93909, "r_x2": 192.96739, "r_y2": 448.62485, "r_x3": 187.33745, "r_y3": 448.62485, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.38654, "r_y0": 573.3194, "r_x1": 173.01648, "r_y1": 573.3194, "r_x2": 173.01648, "r_y2": 566.0051599999999, "r_x3": 167.38654, "r_y3": 566.0051599999999, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.45621000000003, "r_y0": 629.09431, "r_x1": 253.65727, "r_y1": 629.09431, "r_x2": 253.65727, "r_y2": 621.78008, "r_x3": 248.45621000000003, "r_y3": 621.78008, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.90057, "r_y0": 526.5137, "r_x1": 401.53052, "r_y1": 526.5137, "r_x2": 401.53052, "r_y2": 519.19946, "r_x3": 395.90057, "r_y3": 519.19946, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.62886, "r_y0": 597.26784, "r_x1": 177.48148, "r_y1": 597.26784, "r_x2": 177.48148, "r_y2": 580.28853, "r_x3": 171.62886, "r_y3": 580.28853, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.05969000000002, "r_y0": 649.92345, "r_x1": 256.91235, "r_y1": 649.92345, "r_x2": 256.91235, "r_y2": 633.63408, "r_x3": 251.05969000000002, "r_y3": 633.63408, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 607.30864, "r_x1": 427.0379, "r_y1": 607.30864, "r_x2": 427.0379, "r_y2": 601.45724, "r_x3": 372.14645, "r_y3": 601.45724, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 613.75087, "r_x1": 430.06838999999997, "r_y1": 613.75087, "r_x2": 430.06838999999997, "r_y2": 607.89948, "r_x3": 372.14645, "r_y3": 607.89948, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 648.72348, "r_x1": 231.08191, "r_y1": 648.72348, "r_x2": 231.08191, "r_y2": 642.87209, "r_x3": 176.88042, "r_y3": 642.87209, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 655.1657, "r_x1": 230.99271000000002, "r_y1": 655.1657, "r_x2": 230.99271000000002, "r_y2": 649.3143, "r_x3": 176.88042, "r_y3": 649.3143, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 661.60794, "r_x1": 203.93219, "r_y1": 661.60794, "r_x2": 203.93219, "r_y2": 655.7565500000001, "r_x3": 176.88042, "r_y3": 655.7565500000001, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93231000000003, "r_y0": 569.15967, "r_x1": 218.4697, "r_y1": 569.15967, "r_x2": 218.4697, "r_y2": 557.56342, "r_x3": 215.93231000000003, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.05689999999998, "r_y0": 569.15967, "r_x1": 231.71908999999997, "r_y1": 569.15967, "r_x2": 231.71908999999997, "r_y2": 557.56342, "r_x3": 229.05689999999998, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.20892, "r_y0": 451.19727, "r_x1": 263.56973, "r_y1": 451.19727, "r_x2": 263.56973, "r_y2": 448.46124, "r_x3": 261.20892, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33463, "r_y0": 451.19727, "r_x1": 313.6362, "r_y1": 451.19727, "r_x2": 313.6362, "r_y2": 448.46124, "r_x3": 312.33463, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41125, "r_y0": 451.19727, "r_x1": 380.05737, "r_y1": 451.19727, "r_x2": 380.05737, "r_y2": 448.46124, "r_x3": 377.41125, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63976, "r_y0": 456.07599, "r_x1": 205.82492, "r_y1": 456.07599, "r_x2": 205.82492, "r_y2": 453.33997, "r_x3": 200.63976, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.20833000000002, "r_y0": 456.07599, "r_x1": 229.76836, "r_y1": 456.07599, "r_x2": 229.76836, "r_y2": 453.33997, "r_x3": 222.20833000000002, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26666, "r_y0": 456.07599, "r_x1": 250.82669, "r_y1": 456.07599, "r_x2": 250.82669, "r_y2": 453.33997, "r_x3": 243.26666, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29657, "r_y0": 456.07599, "r_x1": 271.84949, "r_y1": 456.07599, "r_x2": 271.84949, "r_y2": 453.33997, "r_x3": 264.29657, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.31943, "r_y0": 456.07599, "r_x1": 292.87946, "r_y1": 456.07599, "r_x2": 292.87946, "r_y2": 453.33997, "r_x3": 285.31943, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37775, "r_y0": 456.07599, "r_x1": 311.77319, "r_y1": 456.07599, "r_x2": 311.77319, "r_y2": 453.33997, "r_x3": 306.37775, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.41699, "r_y0": 456.07599, "r_x1": 325.58157, "r_y1": 456.07599, "r_x2": 325.58157, "r_y2": 453.33997, "r_x3": 323.41699, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.45807, "r_y0": 456.07599, "r_x1": 336.62265, "r_y1": 456.07599, "r_x2": 336.62265, "r_y2": 453.33997, "r_x3": 334.45807, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52756, "r_y0": 456.07599, "r_x1": 347.69214, "r_y1": 456.07599, "r_x2": 347.69214, "r_y2": 453.33997, "r_x3": 345.52756, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56863, "r_y0": 456.07599, "r_x1": 358.73322, "r_y1": 456.07599, "r_x2": 358.73322, "r_y2": 453.33997, "r_x3": 356.56863, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63812, "r_y0": 456.07599, "r_x1": 371.97089, "r_y1": 456.07599, "r_x2": 371.97089, "r_y2": 453.33997, "r_x3": 367.63812, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.6734, "r_y0": 456.07599, "r_x1": 387.00616, "r_y1": 456.07599, "r_x2": 387.00616, "r_y2": 453.33997, "r_x3": 382.6734, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73727, "r_y0": 456.07599, "r_x1": 402.07001, "r_y1": 456.07599, "r_x2": 402.07001, "r_y2": 453.33997, "r_x3": 397.73727, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78879, "r_y0": 457.79964999999993, "r_x1": 414.93463, "r_y1": 457.79964999999993, "r_x2": 414.93463, "r_y2": 447.99298, "r_x3": 412.78879, "r_y3": 447.99298, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.95697, "r_y0": 456.07599, "r_x1": 422.51746, "r_y1": 456.07599, "r_x2": 422.51746, "r_y2": 453.33997, "r_x3": 414.95697, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63998, "r_y0": 466.66043, "r_x1": 204.57674, "r_y1": 466.66043, "r_x2": 204.57674, "r_y2": 463.92444, "r_x3": 200.63998, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62604, "r_y0": 466.66043, "r_x1": 369.58032, "r_y1": 466.66043, "r_x2": 369.58032, "r_y2": 463.92444, "r_x3": 367.62604, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 466.66043, "r_x1": 384.6156, "r_y1": 466.66043, "r_x2": 384.6156, "r_y2": 463.92444, "r_x3": 382.66132, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72504, "r_y0": 466.66043, "r_x1": 399.67932, "r_y1": 466.66043, "r_x2": 399.67932, "r_y2": 463.92444, "r_x3": 397.72504, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.53915, "r_x1": 206.51694, "r_y1": 471.53915, "r_x2": 206.51694, "r_y2": 468.80313, "r_x3": 200.64, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 471.53915, "r_x1": 266.25885, "r_y1": 471.53915, "r_x2": 266.25885, "r_y2": 468.80313, "r_x3": 264.29047, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37213, "r_y0": 471.53915, "r_x1": 308.34052, "r_y1": 471.53915, "r_x2": 308.34052, "r_y2": 468.80313, "r_x3": 306.37213, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.51526, "r_y0": 471.53915, "r_x1": 347.48364, "r_y1": 471.53915, "r_x2": 347.48364, "r_y2": 468.80313, "r_x3": 345.51526, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.55634, "r_y0": 471.53915, "r_x1": 358.52472, "r_y1": 471.53915, "r_x2": 358.52472, "r_y2": 468.80313, "r_x3": 356.55634, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62582, "r_y0": 471.53915, "r_x1": 369.59418, "r_y1": 471.53915, "r_x2": 369.59418, "r_y2": 468.80313, "r_x3": 367.62582, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66107, "r_y0": 471.53915, "r_x1": 384.62946, "r_y1": 471.53915, "r_x2": 384.62946, "r_y2": 468.80313, "r_x3": 382.66107, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.41788, "r_x1": 206.51694, "r_y1": 476.41788, "r_x2": 206.51694, "r_y2": 473.68185, "r_x3": 200.64, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 476.41788, "r_x1": 266.25885, "r_y1": 476.41788, "r_x2": 266.25885, "r_y2": 473.68185, "r_x3": 264.29047, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.26816, "r_x1": 206.51694, "r_y1": 481.26816, "r_x2": 206.51694, "r_y2": 478.53214, "r_x3": 200.64, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26373, "r_y0": 481.26816, "r_x1": 245.2321, "r_y1": 481.26816, "r_x2": 245.2321, "r_y2": 478.53214, "r_x3": 243.26373, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 481.26816, "r_x1": 266.25885, "r_y1": 481.26816, "r_x2": 266.25885, "r_y2": 478.53214, "r_x3": 264.29047, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.40466, "r_y0": 481.26816, "r_x1": 325.37305, "r_y1": 481.26816, "r_x2": 325.37305, "r_y2": 478.53214, "r_x3": 323.40466, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72519, "r_y0": 481.26816, "r_x1": 399.69354, "r_y1": 481.26816, "r_x2": 399.69354, "r_y2": 478.53214, "r_x3": 397.72519, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.14688, "r_x1": 206.51694, "r_y1": 486.14688, "r_x2": 206.51694, "r_y2": 483.41086, "r_x3": 200.64, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 486.14688, "r_x1": 384.61563, "r_y1": 486.14688, "r_x2": 384.61563, "r_y2": 483.41086, "r_x3": 382.66132, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72513, "r_y0": 486.14688, "r_x1": 401.64819, "r_y1": 486.14688, "r_x2": 401.64819, "r_y2": 483.41086, "r_x3": 397.72513, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78928, "r_y0": 486.14688, "r_x1": 414.74359, "r_y1": 486.14688, "r_x2": 414.74359, "r_y2": 483.41086, "r_x3": 412.78928, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64014, "r_y0": 491.0256, "r_x1": 207.14445, "r_y1": 491.0256, "r_x2": 207.14445, "r_y2": 488.28958, "r_x3": 200.64014, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62616, "r_y0": 491.0256, "r_x1": 369.78375, "r_y1": 491.0256, "r_x2": 369.78375, "r_y2": 488.28958, "r_x3": 367.62616, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66141, "r_y0": 491.0256, "r_x1": 384.81897, "r_y1": 491.0256, "r_x2": 384.81897, "r_y2": 488.28958, "r_x3": 382.66141, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7251, "r_y0": 491.0256, "r_x1": 402.05087, "r_y1": 491.0256, "r_x2": 402.05087, "r_y2": 488.28958, "r_x3": 397.7251, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64032, "r_y0": 495.90433, "r_x1": 208.48566, "r_y1": 495.90433, "r_x2": 208.48566, "r_y2": 493.1683, "r_x3": 200.64032, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29044, "r_y0": 495.90433, "r_x1": 266.25879, "r_y1": 495.90433, "r_x2": 266.25879, "r_y2": 493.1683, "r_x3": 264.29044, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 58, "label": "text", "bbox": { "l": 180.12473, "t": 516.2332200000001, "r": 190.62042, "b": 518.94992, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 518.94992, "r_x1": 190.62042, "r_y1": 518.94992, "r_x2": 190.62042, "r_y2": 516.2332200000001, "r_x3": 180.12473, "r_y3": 516.2332200000001, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 183.2438, "t": 520.13208, "r": 304.54797, "b": 522.84879, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 522.84879, "r_x1": 304.54797, "r_y1": 522.84879, "r_x2": 304.54797, "r_y2": 520.13208, "r_x3": 183.2438, "r_y3": 520.13208, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.2438, "t": 524.03094, "r": 388.42313, "b": 526.74765, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 526.74765, "r_x1": 388.42313, "r_y1": 526.74765, "r_x2": 388.42313, "r_y2": 524.03094, "r_x3": 183.2438, "r_y3": 524.03094, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 183.2438, "t": 527.9297799999999, "r": 388.42313, "b": 530.64648, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 530.64648, "r_x1": 388.42313, "r_y1": 530.64648, "r_x2": 388.42313, "r_y2": 527.9297799999999, "r_x3": 183.2438, "r_y3": 527.9297799999999, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 183.2438, "t": 531.82861, "r": 388.42313, "b": 534.54532, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 534.54532, "r_x1": 388.42313, "r_y1": 534.54532, "r_x2": 388.42313, "r_y2": 531.82861, "r_x3": 183.2438, "r_y3": 531.82861, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 183.2438, "t": 535.72748, "r": 388.42313, "b": 538.44418, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 538.44418, "r_x1": 388.42313, "r_y1": 538.44418, "r_x2": 388.42313, "r_y2": 535.72748, "r_x3": 183.2438, "r_y3": 535.72748, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 183.2438, "t": 539.62631, "r": 388.42313, "b": 542.34303, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 542.34303, "r_x1": 388.42313, "r_y1": 542.34303, "r_x2": 388.42313, "r_y2": 539.62631, "r_x3": 183.2438, "r_y3": 539.62631, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 183.2438, "t": 543.52516, "r": 388.42313, "b": 546.24188, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 546.24188, "r_x1": 388.42313, "r_y1": 546.24188, "r_x2": 388.42313, "r_y2": 543.52516, "r_x3": 183.2438, "r_y3": 543.52516, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 183.2438, "t": 547.42401, "r": 388.42313, "b": 550.14073, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 550.14073, "r_x1": 388.42313, "r_y1": 550.14073, "r_x2": 388.42313, "r_y2": 547.42401, "r_x3": 183.2438, "r_y3": 547.42401, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.2438, "t": 551.32286, "r": 388.42313, "b": 554.03958, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2438, "r_y0": 554.03958, "r_x1": 388.42313, "r_y1": 554.03958, "r_x2": 388.42313, "r_y2": 551.32286, "r_x3": 183.2438, "r_y3": 551.32286, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 180.12473, "t": 555.22173, "r": 191.86806, "b": 557.93845, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12473, "r_y0": 557.93845, "r_x1": 191.86806, "r_y1": 557.93845, "r_x2": 191.86806, "r_y2": 555.22173, "r_x3": 180.12473, "r_y3": 555.22173, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 407.38348, "t": 518.30042, "r": 408.82025, "b": 521.01712, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 521.01712, "r_x1": 408.82025, "r_y1": 521.01712, "r_x2": 408.82025, "r_y2": 518.30042, "r_x3": 407.38348, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 410.25699, "t": 518.30042, "r": 450.48605, "b": 521.01712, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 521.01712, "r_x1": 450.48605, "r_y1": 521.01712, "r_x2": 450.48605, "r_y2": 518.30042, "r_x3": 410.25699, "r_y3": 518.30042, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 407.38348, "t": 522.19925, "r": 408.82025, "b": 524.9159500000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 524.9159500000001, "r_x1": 408.82025, "r_y1": 524.9159500000001, "r_x2": 408.82025, "r_y2": 522.19925, "r_x3": 407.38348, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 410.25699, "t": 522.19925, "r": 450.48605, "b": 524.9159500000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 524.9159500000001, "r_x1": 450.48605, "r_y1": 524.9159500000001, "r_x2": 450.48605, "r_y2": 522.19925, "r_x3": 410.25699, "r_y3": 522.19925, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 407.38348, "t": 526.09808, "r": 408.82025, "b": 528.81479, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 528.81479, "r_x1": 408.82025, "r_y1": 528.81479, "r_x2": 408.82025, "r_y2": 526.09808, "r_x3": 407.38348, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 410.25699, "t": 526.09808, "r": 450.48605, "b": 528.81479, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 528.81479, "r_x1": 450.48605, "r_y1": 528.81479, "r_x2": 450.48605, "r_y2": 526.09808, "r_x3": 410.25699, "r_y3": 526.09808, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 407.38348, "t": 529.99695, "r": 408.82025, "b": 532.7136499999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 532.7136499999999, "r_x1": 408.82025, "r_y1": 532.7136499999999, "r_x2": 408.82025, "r_y2": 529.99695, "r_x3": 407.38348, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 410.25699, "t": 529.99695, "r": 450.48605, "b": 532.7136499999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 532.7136499999999, "r_x1": 450.48605, "r_y1": 532.7136499999999, "r_x2": 450.48605, "r_y2": 529.99695, "r_x3": 410.25699, "r_y3": 529.99695, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 407.38348, "t": 533.8957800000001, "r": 408.82025, "b": 536.6125, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 536.6125, "r_x1": 408.82025, "r_y1": 536.6125, "r_x2": 408.82025, "r_y2": 533.8957800000001, "r_x3": 407.38348, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 410.25699, "t": 533.8957800000001, "r": 450.48605, "b": 536.6125, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 536.6125, "r_x1": 450.48605, "r_y1": 536.6125, "r_x2": 450.48605, "r_y2": 533.8957800000001, "r_x3": 410.25699, "r_y3": 533.8957800000001, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 407.38348, "t": 537.79463, "r": 408.82025, "b": 540.51135, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 540.51135, "r_x1": 408.82025, "r_y1": 540.51135, "r_x2": 408.82025, "r_y2": 537.79463, "r_x3": 407.38348, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 410.25699, "t": 537.79463, "r": 450.48605, "b": 540.51135, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 540.51135, "r_x1": 450.48605, "r_y1": 540.51135, "r_x2": 450.48605, "r_y2": 537.79463, "r_x3": 410.25699, "r_y3": 537.79463, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 407.38348, "t": 541.69348, "r": 408.82025, "b": 544.4102, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 544.4102, "r_x1": 408.82025, "r_y1": 544.4102, "r_x2": 408.82025, "r_y2": 541.69348, "r_x3": 407.38348, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 410.25699, "t": 541.69348, "r": 450.48605, "b": 544.4102, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 544.4102, "r_x1": 450.48605, "r_y1": 544.4102, "r_x2": 450.48605, "r_y2": 541.69348, "r_x3": 410.25699, "r_y3": 541.69348, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 407.38348, "t": 545.59233, "r": 408.82025, "b": 548.3090500000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 548.3090500000001, "r_x1": 408.82025, "r_y1": 548.3090500000001, "r_x2": 408.82025, "r_y2": 545.59233, "r_x3": 407.38348, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 410.25699, "t": 545.59233, "r": 450.48605, "b": 548.3090500000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 548.3090500000001, "r_x1": 450.48605, "r_y1": 548.3090500000001, "r_x2": 450.48605, "r_y2": 545.59233, "r_x3": 410.25699, "r_y3": 545.59233, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 407.38348, "t": 549.4911999999999, "r": 408.82025, "b": 552.2079200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38348, "r_y0": 552.2079200000001, "r_x1": 408.82025, "r_y1": 552.2079200000001, "r_x2": 408.82025, "r_y2": 549.4911999999999, "r_x3": 407.38348, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 410.25699, "t": 549.4911999999999, "r": 450.48605, "b": 552.2079200000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.25699, "r_y0": 552.2079200000001, "r_x1": 450.48605, "r_y1": 552.2079200000001, "r_x2": 450.48605, "r_y2": 549.4911999999999, "r_x3": 410.25699, "r_y3": 549.4911999999999, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 164.52881, "t": 509.45859, "r": 181.8528, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.52881, "r_y0": 515.31, "r_x1": 181.8528, "r_y1": 515.31, "r_x2": 181.8528, "r_y2": 509.45859, "r_x3": 164.52881, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.58441, "t": 509.45859, "r": 186.3974, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58441, "r_y0": 515.31, "r_x1": 186.3974, "r_y1": 515.31, "r_x2": 186.3974, "r_y2": 509.45859, "r_x3": 183.58441, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 189.2104, "t": 509.45859, "r": 208.90137, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2104, "r_y0": 515.31, "r_x1": 208.90137, "r_y1": 515.31, "r_x2": 208.90137, "r_y2": 509.45859, "r_x3": 189.2104, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 210.63269, "t": 509.45859, "r": 221.04044, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63269, "r_y0": 515.31, "r_x1": 221.04044, "r_y1": 515.31, "r_x2": 221.04044, "r_y2": 509.45859, "r_x3": 210.63269, "r_y3": 509.45859, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 390.20203, "t": 509.60361, "r": 406.83609, "b": 515.45502, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.20203, "r_y0": 515.45502, "r_x1": 406.83609, "r_y1": 515.45502, "r_x2": 406.83609, "r_y2": 509.60361, "r_x3": 390.20203, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 408.56952, "t": 509.60361, "r": 411.38251, "b": 515.45502, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.56952, "r_y0": 515.45502, "r_x1": 411.38251, "r_y1": 515.45502, "r_x2": 411.38251, "r_y2": 509.60361, "r_x3": 408.56952, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 414.1955, "t": 509.60361, "r": 433.88647000000003, "b": 515.45502, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.1955, "r_y0": 515.45502, "r_x1": 433.88647000000003, "r_y1": 515.45502, "r_x2": 433.88647000000003, "r_y2": 509.60361, "r_x3": 414.1955, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 435.61737, "t": 509.60361, "r": 446.02512, "b": 515.45502, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61737, "r_y0": 515.45502, "r_x1": 446.02512, "r_y1": 515.45502, "r_x2": 446.02512, "r_y2": 509.60361, "r_x3": 435.61737, "r_y3": 509.60361, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 167.19316, "t": 519.07236, "r": 172.8231, "b": 526.3866, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19316, "r_y0": 526.3866, "r_x1": 172.8231, "r_y1": 526.3866, "r_x2": 172.8231, "r_y2": 519.07236, "r_x3": 167.19316, "r_y3": 519.07236, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 187.33745, "t": 448.62485, "r": 192.96739, "b": 455.93909, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.33745, "r_y0": 455.93909, "r_x1": 192.96739, "r_y1": 455.93909, "r_x2": 192.96739, "r_y2": 448.62485, "r_x3": 187.33745, "r_y3": 448.62485, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 167.38654, "t": 566.0051599999999, "r": 173.01648, "b": 573.3194, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.38654, "r_y0": 573.3194, "r_x1": 173.01648, "r_y1": 573.3194, "r_x2": 173.01648, "r_y2": 566.0051599999999, "r_x3": 167.38654, "r_y3": 566.0051599999999, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 248.45621000000003, "t": 621.78008, "r": 253.65727, "b": 629.09431, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.45621000000003, "r_y0": 629.09431, "r_x1": 253.65727, "r_y1": 629.09431, "r_x2": 253.65727, "r_y2": 621.78008, "r_x3": 248.45621000000003, "r_y3": 621.78008, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 395.90057, "t": 519.19946, "r": 401.53052, "b": 526.5137, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.90057, "r_y0": 526.5137, "r_x1": 401.53052, "r_y1": 526.5137, "r_x2": 401.53052, "r_y2": 519.19946, "r_x3": 395.90057, "r_y3": 519.19946, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 171.62886, "t": 580.28853, "r": 177.48148, "b": 597.26784, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.62886, "r_y0": 597.26784, "r_x1": 177.48148, "r_y1": 597.26784, "r_x2": 177.48148, "r_y2": 580.28853, "r_x3": 171.62886, "r_y3": 580.28853, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 251.05969000000002, "t": 633.63408, "r": 256.91235, "b": 649.92345, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.05969000000002, "r_y0": 649.92345, "r_x1": 256.91235, "r_y1": 649.92345, "r_x2": 256.91235, "r_y2": 633.63408, "r_x3": 251.05969000000002, "r_y3": 633.63408, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 372.14645, "t": 601.45724, "r": 427.0379, "b": 607.30864, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 607.30864, "r_x1": 427.0379, "r_y1": 607.30864, "r_x2": 427.0379, "r_y2": 601.45724, "r_x3": 372.14645, "r_y3": 601.45724, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 372.14645, "t": 607.89948, "r": 430.06838999999997, "b": 613.75087, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.14645, "r_y0": 613.75087, "r_x1": 430.06838999999997, "r_y1": 613.75087, "r_x2": 430.06838999999997, "r_y2": 607.89948, "r_x3": 372.14645, "r_y3": 607.89948, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 176.88042, "t": 642.87209, "r": 231.08191, "b": 648.72348, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 648.72348, "r_x1": 231.08191, "r_y1": 648.72348, "r_x2": 231.08191, "r_y2": 642.87209, "r_x3": 176.88042, "r_y3": 642.87209, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 176.88042, "t": 649.3143, "r": 230.99271000000002, "b": 655.1657, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 655.1657, "r_x1": 230.99271000000002, "r_y1": 655.1657, "r_x2": 230.99271000000002, "r_y2": 649.3143, "r_x3": 176.88042, "r_y3": 649.3143, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 176.88042, "t": 655.7565500000001, "r": 203.93219, "b": 661.60794, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88042, "r_y0": 661.60794, "r_x1": 203.93219, "r_y1": 661.60794, "r_x2": 203.93219, "r_y2": 655.7565500000001, "r_x3": 176.88042, "r_y3": 655.7565500000001, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 215.93231000000003, "t": 557.56342, "r": 218.4697, "b": 569.15967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93231000000003, "r_y0": 569.15967, "r_x1": 218.4697, "r_y1": 569.15967, "r_x2": 218.4697, "r_y2": 557.56342, "r_x3": 215.93231000000003, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 229.05689999999998, "t": 557.56342, "r": 231.71908999999997, "b": 569.15967, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.05689999999998, "r_y0": 569.15967, "r_x1": 231.71908999999997, "r_y1": 569.15967, "r_x2": 231.71908999999997, "r_y2": 557.56342, "r_x3": 229.05689999999998, "r_y3": 557.56342, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 261.20892, "t": 448.46124, "r": 263.56973, "b": 451.19727, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.20892, "r_y0": 451.19727, "r_x1": 263.56973, "r_y1": 451.19727, "r_x2": 263.56973, "r_y2": 448.46124, "r_x3": 261.20892, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 312.33463, "t": 448.46124, "r": 313.6362, "b": 451.19727, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33463, "r_y0": 451.19727, "r_x1": 313.6362, "r_y1": 451.19727, "r_x2": 313.6362, "r_y2": 448.46124, "r_x3": 312.33463, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 377.41125, "t": 448.46124, "r": 380.05737, "b": 451.19727, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41125, "r_y0": 451.19727, "r_x1": 380.05737, "r_y1": 451.19727, "r_x2": 380.05737, "r_y2": 448.46124, "r_x3": 377.41125, "r_y3": 448.46124, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 200.63976, "t": 453.33997, "r": 205.82492, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63976, "r_y0": 456.07599, "r_x1": 205.82492, "r_y1": 456.07599, "r_x2": 205.82492, "r_y2": 453.33997, "r_x3": 200.63976, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 222.20833000000002, "t": 453.33997, "r": 229.76836, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.20833000000002, "r_y0": 456.07599, "r_x1": 229.76836, "r_y1": 456.07599, "r_x2": 229.76836, "r_y2": 453.33997, "r_x3": 222.20833000000002, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 243.26666, "t": 453.33997, "r": 250.82669, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26666, "r_y0": 456.07599, "r_x1": 250.82669, "r_y1": 456.07599, "r_x2": 250.82669, "r_y2": 453.33997, "r_x3": 243.26666, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 264.29657, "t": 453.33997, "r": 271.84949, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29657, "r_y0": 456.07599, "r_x1": 271.84949, "r_y1": 456.07599, "r_x2": 271.84949, "r_y2": 453.33997, "r_x3": 264.29657, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 285.31943, "t": 453.33997, "r": 292.87946, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.31943, "r_y0": 456.07599, "r_x1": 292.87946, "r_y1": 456.07599, "r_x2": 292.87946, "r_y2": 453.33997, "r_x3": 285.31943, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 306.37775, "t": 453.33997, "r": 311.77319, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37775, "r_y0": 456.07599, "r_x1": 311.77319, "r_y1": 456.07599, "r_x2": 311.77319, "r_y2": 453.33997, "r_x3": 306.37775, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 323.41699, "t": 453.33997, "r": 325.58157, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.41699, "r_y0": 456.07599, "r_x1": 325.58157, "r_y1": 456.07599, "r_x2": 325.58157, "r_y2": 453.33997, "r_x3": 323.41699, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 334.45807, "t": 453.33997, "r": 336.62265, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.45807, "r_y0": 456.07599, "r_x1": 336.62265, "r_y1": 456.07599, "r_x2": 336.62265, "r_y2": 453.33997, "r_x3": 334.45807, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 345.52756, "t": 453.33997, "r": 347.69214, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52756, "r_y0": 456.07599, "r_x1": 347.69214, "r_y1": 456.07599, "r_x2": 347.69214, "r_y2": 453.33997, "r_x3": 345.52756, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 356.56863, "t": 453.33997, "r": 358.73322, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56863, "r_y0": 456.07599, "r_x1": 358.73322, "r_y1": 456.07599, "r_x2": 358.73322, "r_y2": 453.33997, "r_x3": 356.56863, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 367.63812, "t": 453.33997, "r": 371.97089, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63812, "r_y0": 456.07599, "r_x1": 371.97089, "r_y1": 456.07599, "r_x2": 371.97089, "r_y2": 453.33997, "r_x3": 367.63812, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 382.6734, "t": 453.33997, "r": 387.00616, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.6734, "r_y0": 456.07599, "r_x1": 387.00616, "r_y1": 456.07599, "r_x2": 387.00616, "r_y2": 453.33997, "r_x3": 382.6734, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 397.73727, "t": 453.33997, "r": 402.07001, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73727, "r_y0": 456.07599, "r_x1": 402.07001, "r_y1": 456.07599, "r_x2": 402.07001, "r_y2": 453.33997, "r_x3": 397.73727, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 412.78879, "t": 447.99298, "r": 414.93463, "b": 457.79964999999993, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78879, "r_y0": 457.79964999999993, "r_x1": 414.93463, "r_y1": 457.79964999999993, "r_x2": 414.93463, "r_y2": 447.99298, "r_x3": 412.78879, "r_y3": 447.99298, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 414.95697, "t": 453.33997, "r": 422.51746, "b": 456.07599, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.95697, "r_y0": 456.07599, "r_x1": 422.51746, "r_y1": 456.07599, "r_x2": 422.51746, "r_y2": 453.33997, "r_x3": 414.95697, "r_y3": 453.33997, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 200.63998, "t": 463.92444, "r": 204.57674, "b": 466.66043, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.63998, "r_y0": 466.66043, "r_x1": 204.57674, "r_y1": 466.66043, "r_x2": 204.57674, "r_y2": 463.92444, "r_x3": 200.63998, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 367.62604, "t": 463.92444, "r": 369.58032, "b": 466.66043, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62604, "r_y0": 466.66043, "r_x1": 369.58032, "r_y1": 466.66043, "r_x2": 369.58032, "r_y2": 463.92444, "r_x3": 367.62604, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 382.66132, "t": 463.92444, "r": 384.6156, "b": 466.66043, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 466.66043, "r_x1": 384.6156, "r_y1": 466.66043, "r_x2": 384.6156, "r_y2": 463.92444, "r_x3": 382.66132, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 397.72504, "t": 463.92444, "r": 399.67932, "b": 466.66043, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72504, "r_y0": 466.66043, "r_x1": 399.67932, "r_y1": 466.66043, "r_x2": 399.67932, "r_y2": 463.92444, "r_x3": 397.72504, "r_y3": 463.92444, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 200.64, "t": 468.80313, "r": 206.51694, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.53915, "r_x1": 206.51694, "r_y1": 471.53915, "r_x2": 206.51694, "r_y2": 468.80313, "r_x3": 200.64, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 264.29047, "t": 468.80313, "r": 266.25885, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 471.53915, "r_x1": 266.25885, "r_y1": 471.53915, "r_x2": 266.25885, "r_y2": 468.80313, "r_x3": 264.29047, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 306.37213, "t": 468.80313, "r": 308.34052, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37213, "r_y0": 471.53915, "r_x1": 308.34052, "r_y1": 471.53915, "r_x2": 308.34052, "r_y2": 468.80313, "r_x3": 306.37213, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 345.51526, "t": 468.80313, "r": 347.48364, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.51526, "r_y0": 471.53915, "r_x1": 347.48364, "r_y1": 471.53915, "r_x2": 347.48364, "r_y2": 468.80313, "r_x3": 345.51526, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 356.55634, "t": 468.80313, "r": 358.52472, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.55634, "r_y0": 471.53915, "r_x1": 358.52472, "r_y1": 471.53915, "r_x2": 358.52472, "r_y2": 468.80313, "r_x3": 356.55634, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 367.62582, "t": 468.80313, "r": 369.59418, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62582, "r_y0": 471.53915, "r_x1": 369.59418, "r_y1": 471.53915, "r_x2": 369.59418, "r_y2": 468.80313, "r_x3": 367.62582, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 382.66107, "t": 468.80313, "r": 384.62946, "b": 471.53915, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66107, "r_y0": 471.53915, "r_x1": 384.62946, "r_y1": 471.53915, "r_x2": 384.62946, "r_y2": 468.80313, "r_x3": 382.66107, "r_y3": 468.80313, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 200.64, "t": 473.68185, "r": 206.51694, "b": 476.41788, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.41788, "r_x1": 206.51694, "r_y1": 476.41788, "r_x2": 206.51694, "r_y2": 473.68185, "r_x3": 200.64, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 264.29047, "t": 473.68185, "r": 266.25885, "b": 476.41788, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 476.41788, "r_x1": 266.25885, "r_y1": 476.41788, "r_x2": 266.25885, "r_y2": 473.68185, "r_x3": 264.29047, "r_y3": 473.68185, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 200.64, "t": 478.53214, "r": 206.51694, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.26816, "r_x1": 206.51694, "r_y1": 481.26816, "r_x2": 206.51694, "r_y2": 478.53214, "r_x3": 200.64, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 243.26373, "t": 478.53214, "r": 245.2321, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26373, "r_y0": 481.26816, "r_x1": 245.2321, "r_y1": 481.26816, "r_x2": 245.2321, "r_y2": 478.53214, "r_x3": 243.26373, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 264.29047, "t": 478.53214, "r": 266.25885, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29047, "r_y0": 481.26816, "r_x1": 266.25885, "r_y1": 481.26816, "r_x2": 266.25885, "r_y2": 478.53214, "r_x3": 264.29047, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 323.40466, "t": 478.53214, "r": 325.37305, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.40466, "r_y0": 481.26816, "r_x1": 325.37305, "r_y1": 481.26816, "r_x2": 325.37305, "r_y2": 478.53214, "r_x3": 323.40466, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 397.72519, "t": 478.53214, "r": 399.69354, "b": 481.26816, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72519, "r_y0": 481.26816, "r_x1": 399.69354, "r_y1": 481.26816, "r_x2": 399.69354, "r_y2": 478.53214, "r_x3": 397.72519, "r_y3": 478.53214, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 200.64, "t": 483.41086, "r": 206.51694, "b": 486.14688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.14688, "r_x1": 206.51694, "r_y1": 486.14688, "r_x2": 206.51694, "r_y2": 483.41086, "r_x3": 200.64, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 382.66132, "t": 483.41086, "r": 384.61563, "b": 486.14688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66132, "r_y0": 486.14688, "r_x1": 384.61563, "r_y1": 486.14688, "r_x2": 384.61563, "r_y2": 483.41086, "r_x3": 382.66132, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 397.72513, "t": 483.41086, "r": 401.64819, "b": 486.14688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.72513, "r_y0": 486.14688, "r_x1": 401.64819, "r_y1": 486.14688, "r_x2": 401.64819, "r_y2": 483.41086, "r_x3": 397.72513, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 412.78928, "t": 483.41086, "r": 414.74359, "b": 486.14688, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.78928, "r_y0": 486.14688, "r_x1": 414.74359, "r_y1": 486.14688, "r_x2": 414.74359, "r_y2": 483.41086, "r_x3": 412.78928, "r_y3": 483.41086, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 200.64014, "t": 488.28958, "r": 207.14445, "b": 491.0256, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64014, "r_y0": 491.0256, "r_x1": 207.14445, "r_y1": 491.0256, "r_x2": 207.14445, "r_y2": 488.28958, "r_x3": 200.64014, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 367.62616, "t": 488.28958, "r": 369.78375, "b": 491.0256, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.62616, "r_y0": 491.0256, "r_x1": 369.78375, "r_y1": 491.0256, "r_x2": 369.78375, "r_y2": 488.28958, "r_x3": 367.62616, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 382.66141, "t": 488.28958, "r": 384.81897, "b": 491.0256, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66141, "r_y0": 491.0256, "r_x1": 384.81897, "r_y1": 491.0256, "r_x2": 384.81897, "r_y2": 488.28958, "r_x3": 382.66141, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 397.7251, "t": 488.28958, "r": 402.05087, "b": 491.0256, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7251, "r_y0": 491.0256, "r_x1": 402.05087, "r_y1": 491.0256, "r_x2": 402.05087, "r_y2": 488.28958, "r_x3": 397.7251, "r_y3": 488.28958, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 200.64032, "t": 493.1683, "r": 208.48566, "b": 495.90433, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64032, "r_y0": 495.90433, "r_x1": 208.48566, "r_y1": 495.90433, "r_x2": 208.48566, "r_y2": 493.1683, "r_x3": 200.64032, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 264.29044, "t": 493.1683, "r": 266.25879, "b": 495.90433, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29044, "r_y0": 495.90433, "r_x1": 266.25879, "r_y1": 495.90433, "r_x2": 266.25879, "r_y2": 493.1683, "r_x3": 264.29044, "r_y3": 493.1683, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 155, "page_no": 9, "cluster": { "id": 155, "label": "text", "bbox": { "l": 227.91466, "t": 665.82603, "r": 230.10028, "b": 675.3464, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.91466, "r_y0": 675.3464, "r_x1": 230.10028, "r_y1": 675.3464, "r_x2": 230.10028, "r_y2": 665.82603, "r_x3": 227.91466, "r_y3": 665.82603, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u03bc" }, { "label": "text", "id": 156, "page_no": 9, "cluster": { "id": 156, "label": "text", "bbox": { "l": 300.58057, "t": 683.62195, "r": 302.72638, "b": 693.428658, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.58057, "r_y0": 693.428658, "r_x1": 302.72638, "r_y1": 693.428658, "r_x2": 302.72638, "r_y2": 683.62195, "r_x3": 300.58057, "r_y3": 683.62195, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u2265" } ], "headers": [ { "label": "page_header", "id": 7, "page_no": 9, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 143.97887, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8309906721115112, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 143.97887, "r_y1": 101.84069999999997, "r_x2": 143.97887, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10" }, { "label": "page_header", "id": 6, "page_no": 9, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 167.82053, "t": 93.77099999999996, "r": 231.72049000000004, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8367075324058533, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82053, "r_y0": 101.84069999999997, "r_x1": 178.08249, "r_y1": 101.84069999999997, "r_x2": 178.08249, "r_y2": 93.77099999999996, "r_x3": 167.82053, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37929, "r_y0": 101.84069999999997, "r_x1": 231.72049000000004, "r_y1": 101.84069999999997, "r_x2": 231.72049000000004, "r_y2": 93.77099999999996, "r_x3": 182.37929, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 10, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.37561, "r_y0": 101.84069999999997, "r_x1": 480.5894799999999, "r_y1": 101.84069999999997, "r_x2": 480.5894799999999, "r_y2": 93.77099999999996, "r_x3": 471.37561, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 133.72551999999996, "r_x1": 162.64424, "r_y1": 133.72551999999996, "r_x2": 162.64424, "r_y2": 125.79918999999984, "r_x3": 134.765, "r_y3": 125.79918999999984, "coord_origin": "TOPLEFT" }, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.215, "r_y0": 133.93169999999998, "r_x1": 480.58752, "r_y1": 133.93169999999998, "r_x2": 480.58752, "r_y2": 125.86200000000008, "r_x3": 165.215, "r_y3": 125.86200000000008, "coord_origin": "TOPLEFT" }, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 144.89068999999995, "r_x1": 480.58823, "r_y1": 144.89068999999995, "r_x2": 480.58823, "r_y2": 136.82097999999996, "r_x3": 134.765, "r_y3": 136.82097999999996, "coord_origin": "TOPLEFT" }, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 155.84966999999995, "r_x1": 480.5881999999999, "r_y1": 155.84966999999995, "r_x2": 480.5881999999999, "r_y2": 147.77997000000005, "r_x3": 134.765, "r_y3": 147.77997000000005, "coord_origin": "TOPLEFT" }, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 166.80864999999994, "r_x1": 480.58838000000003, "r_y1": 166.80864999999994, "r_x2": 480.58838000000003, "r_y2": 158.73895000000005, "r_x3": 134.765, "r_y3": 158.73895000000005, "coord_origin": "TOPLEFT" }, "text": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 177.76764000000003, "r_x1": 415.84454, "r_y1": 177.76764000000003, "r_x2": 415.84454, "r_y2": 169.69794000000002, "r_x3": 134.765, "r_y3": 169.69794000000002, "coord_origin": "TOPLEFT" }, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5049, "r_y0": 320.36386, "r_x1": 177.59613, "r_y1": 320.36386, "r_x2": 177.59613, "r_y2": 312.45032, "r_x3": 171.5049, "r_y3": 312.45032, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.05823, "r_y0": 500.56628, "r_x1": 177.14946, "r_y1": 500.56628, "r_x2": 177.14946, "r_y2": 492.65274, "r_x3": 171.05823, "r_y3": 492.65274, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 633.4168099999999, "r_x1": 374.96332, "r_y1": 633.4168099999999, "r_x2": 374.96332, "r_y2": 627.48166, "r_x3": 283.047, "r_y3": 627.48166, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 623.29291, "r_x1": 398.05978, "r_y1": 623.29291, "r_x2": 398.05978, "r_y2": 617.35776, "r_x3": 283.047, "r_y3": 617.35776, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64209, "r_y0": 471.53299, "r_x1": 437.50800000000004, "r_y1": 471.53299, "r_x2": 437.50800000000004, "r_y2": 465.59784, "r_x3": 293.64209, "r_y3": 465.59784, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 294.2947700000001, "r_x1": 239.23492, "r_y1": 294.2947700000001, "r_x2": 239.23492, "r_y2": 288.35962000000006, "r_x3": 181.89114, "r_y3": 288.35962000000006, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 300.82938, "r_x1": 251.52917, "r_y1": 300.82938, "r_x2": 251.52917, "r_y2": 294.89423, "r_x3": 181.89114, "r_y3": 294.89423, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83432, "r_y0": 194.81635000000006, "r_x1": 253.61339, "r_y1": 194.81635000000006, "r_x2": 253.61339, "r_y2": 184.75989000000004, "r_x3": 247.83432, "r_y3": 184.75989000000004, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.18976, "r_y0": 613.7412400000001, "r_x1": 381.54663, "r_y1": 613.7412400000001, "r_x2": 381.54663, "r_y2": 607.80609, "r_x3": 292.18976, "r_y3": 607.80609, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27777, "r_y0": 403.40067, "r_x1": 180.18666, "r_y1": 403.40067, "r_x2": 180.18666, "r_y2": 381.36288, "r_x3": 172.27777, "r_y3": 381.36288, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27747, "r_y0": 578.7478, "r_x1": 180.18663, "r_y1": 578.7478, "r_x2": 180.18663, "r_y2": 555.7769499999999, "r_x3": 172.27747, "r_y3": 555.7769499999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 0, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9301655888557434, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "page_header", "bbox": { "l": 471.37561, "t": 93.77099999999996, "r": 480.5894799999999, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9007201790809631, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.37561, "r_y0": 101.84069999999997, "r_x1": 480.5894799999999, "r_y1": 101.84069999999997, "r_x2": 480.5894799999999, "r_y2": 93.77099999999996, "r_x3": 471.37561, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "caption", "bbox": { "l": 134.765, "t": 125.79918999999984, "r": 480.58838000000003, "b": 177.76764000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.8657060861587524, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 133.72551999999996, "r_x1": 162.64424, "r_y1": 133.72551999999996, "r_x2": 162.64424, "r_y2": 125.79918999999984, "r_x3": 134.765, "r_y3": 125.79918999999984, "coord_origin": "TOPLEFT" }, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.215, "r_y0": 133.93169999999998, "r_x1": 480.58752, "r_y1": 133.93169999999998, "r_x2": 480.58752, "r_y2": 125.86200000000008, "r_x3": 165.215, "r_y3": 125.86200000000008, "coord_origin": "TOPLEFT" }, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 144.89068999999995, "r_x1": 480.58823, "r_y1": 144.89068999999995, "r_x2": 480.58823, "r_y2": 136.82097999999996, "r_x3": 134.765, "r_y3": 136.82097999999996, "coord_origin": "TOPLEFT" }, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 155.84966999999995, "r_x1": 480.5881999999999, "r_y1": 155.84966999999995, "r_x2": 480.5881999999999, "r_y2": 147.77997000000005, "r_x3": 134.765, "r_y3": 147.77997000000005, "coord_origin": "TOPLEFT" }, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 166.80864999999994, "r_x1": 480.58838000000003, "r_y1": 166.80864999999994, "r_x2": 480.58838000000003, "r_y2": 158.73895000000005, "r_x3": 134.765, "r_y3": 158.73895000000005, "coord_origin": "TOPLEFT" }, "text": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 177.76764000000003, "r_x1": 415.84454, "r_y1": 177.76764000000003, "r_x2": 415.84454, "r_y2": 169.69794000000002, "r_x3": 134.765, "r_y3": 169.69794000000002, "coord_origin": "TOPLEFT" }, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "picture", "bbox": { "l": 168.39285278320312, "t": 181.9665069580078, "r": 447.35137939453125, "b": 634.0056762695312, "coord_origin": "TOPLEFT" }, "confidence": 0.7612658739089966, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5049, "r_y0": 320.36386, "r_x1": 177.59613, "r_y1": 320.36386, "r_x2": 177.59613, "r_y2": 312.45032, "r_x3": 171.5049, "r_y3": 312.45032, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.05823, "r_y0": 500.56628, "r_x1": 177.14946, "r_y1": 500.56628, "r_x2": 177.14946, "r_y2": 492.65274, "r_x3": 171.05823, "r_y3": 492.65274, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 633.4168099999999, "r_x1": 374.96332, "r_y1": 633.4168099999999, "r_x2": 374.96332, "r_y2": 627.48166, "r_x3": 283.047, "r_y3": 627.48166, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 623.29291, "r_x1": 398.05978, "r_y1": 623.29291, "r_x2": 398.05978, "r_y2": 617.35776, "r_x3": 283.047, "r_y3": 617.35776, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64209, "r_y0": 471.53299, "r_x1": 437.50800000000004, "r_y1": 471.53299, "r_x2": 437.50800000000004, "r_y2": 465.59784, "r_x3": 293.64209, "r_y3": 465.59784, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 294.2947700000001, "r_x1": 239.23492, "r_y1": 294.2947700000001, "r_x2": 239.23492, "r_y2": 288.35962000000006, "r_x3": 181.89114, "r_y3": 288.35962000000006, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 300.82938, "r_x1": 251.52917, "r_y1": 300.82938, "r_x2": 251.52917, "r_y2": 294.89423, "r_x3": 181.89114, "r_y3": 294.89423, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83432, "r_y0": 194.81635000000006, "r_x1": 253.61339, "r_y1": 194.81635000000006, "r_x2": 253.61339, "r_y2": 184.75989000000004, "r_x3": 247.83432, "r_y3": 184.75989000000004, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.18976, "r_y0": 613.7412400000001, "r_x1": 381.54663, "r_y1": 613.7412400000001, "r_x2": 381.54663, "r_y2": 607.80609, "r_x3": 292.18976, "r_y3": 607.80609, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27777, "r_y0": 403.40067, "r_x1": 180.18666, "r_y1": 403.40067, "r_x2": 180.18666, "r_y2": 381.36288, "r_x3": 172.27777, "r_y3": 381.36288, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27747, "r_y0": 578.7478, "r_x1": 180.18663, "r_y1": 578.7478, "r_x2": 180.18663, "r_y2": 555.7769499999999, "r_x3": 172.27747, "r_y3": 555.7769499999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 18, "label": "text", "bbox": { "l": 171.5049, "t": 312.45032, "r": 177.59613, "b": 320.36386, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5049, "r_y0": 320.36386, "r_x1": 177.59613, "r_y1": 320.36386, "r_x2": 177.59613, "r_y2": 312.45032, "r_x3": 171.5049, "r_y3": 312.45032, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 171.05823, "t": 492.65274, "r": 177.14946, "b": 500.56628, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.05823, "r_y0": 500.56628, "r_x1": 177.14946, "r_y1": 500.56628, "r_x2": 177.14946, "r_y2": 492.65274, "r_x3": 171.05823, "r_y3": 492.65274, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 283.047, "t": 627.48166, "r": 374.96332, "b": 633.4168099999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 633.4168099999999, "r_x1": 374.96332, "r_y1": 633.4168099999999, "r_x2": 374.96332, "r_y2": 627.48166, "r_x3": 283.047, "r_y3": 627.48166, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 283.047, "t": 617.35776, "r": 398.05978, "b": 623.29291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 623.29291, "r_x1": 398.05978, "r_y1": 623.29291, "r_x2": 398.05978, "r_y2": 617.35776, "r_x3": 283.047, "r_y3": 617.35776, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 293.64209, "t": 465.59784, "r": 437.50800000000004, "b": 471.53299, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64209, "r_y0": 471.53299, "r_x1": 437.50800000000004, "r_y1": 471.53299, "r_x2": 437.50800000000004, "r_y2": 465.59784, "r_x3": 293.64209, "r_y3": 465.59784, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 181.89114, "t": 288.35962000000006, "r": 239.23492, "b": 294.2947700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 294.2947700000001, "r_x1": 239.23492, "r_y1": 294.2947700000001, "r_x2": 239.23492, "r_y2": 288.35962000000006, "r_x3": 181.89114, "r_y3": 288.35962000000006, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 181.89114, "t": 294.89423, "r": 251.52917, "b": 300.82938, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 300.82938, "r_x1": 251.52917, "r_y1": 300.82938, "r_x2": 251.52917, "r_y2": 294.89423, "r_x3": 181.89114, "r_y3": 294.89423, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 247.83432, "t": 184.75989000000004, "r": 253.61339, "b": 194.81635000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83432, "r_y0": 194.81635000000006, "r_x1": 253.61339, "r_y1": 194.81635000000006, "r_x2": 253.61339, "r_y2": 184.75989000000004, "r_x3": 247.83432, "r_y3": 184.75989000000004, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 292.18976, "t": 607.80609, "r": 381.54663, "b": 613.7412400000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.18976, "r_y0": 613.7412400000001, "r_x1": 381.54663, "r_y1": 613.7412400000001, "r_x2": 381.54663, "r_y2": 607.80609, "r_x3": 292.18976, "r_y3": 607.80609, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 172.27777, "t": 381.36288, "r": 180.18666, "b": 403.40067, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27777, "r_y0": 403.40067, "r_x1": 180.18666, "r_y1": 403.40067, "r_x2": 180.18666, "r_y2": 381.36288, "r_x3": 172.27777, "r_y3": 381.36288, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 172.27747, "t": 555.7769499999999, "r": 180.18663, "b": 578.7478, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27747, "r_y0": 578.7478, "r_x1": 180.18663, "r_y1": 578.7478, "r_x2": 180.18663, "r_y2": 555.7769499999999, "r_x3": 172.27747, "r_y3": 555.7769499999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 0, "page_no": 10, "cluster": { "id": 0, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9301655888557434, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 1, "page_no": 10, "cluster": { "id": 1, "label": "page_header", "bbox": { "l": 471.37561, "t": 93.77099999999996, "r": 480.5894799999999, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9007201790809631, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.37561, "r_y0": 101.84069999999997, "r_x1": 480.5894799999999, "r_y1": 101.84069999999997, "r_x2": 480.5894799999999, "r_y2": 93.77099999999996, "r_x3": 471.37561, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11" }, { "label": "caption", "id": 2, "page_no": 10, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 134.765, "t": 125.79918999999984, "r": 480.58838000000003, "b": 177.76764000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.8657060861587524, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 133.72551999999996, "r_x1": 162.64424, "r_y1": 133.72551999999996, "r_x2": 162.64424, "r_y2": 125.79918999999984, "r_x3": 134.765, "r_y3": 125.79918999999984, "coord_origin": "TOPLEFT" }, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.215, "r_y0": 133.93169999999998, "r_x1": 480.58752, "r_y1": 133.93169999999998, "r_x2": 480.58752, "r_y2": 125.86200000000008, "r_x3": 165.215, "r_y3": 125.86200000000008, "coord_origin": "TOPLEFT" }, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 144.89068999999995, "r_x1": 480.58823, "r_y1": 144.89068999999995, "r_x2": 480.58823, "r_y2": 136.82097999999996, "r_x3": 134.765, "r_y3": 136.82097999999996, "coord_origin": "TOPLEFT" }, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 155.84966999999995, "r_x1": 480.5881999999999, "r_y1": 155.84966999999995, "r_x2": 480.5881999999999, "r_y2": 147.77997000000005, "r_x3": 134.765, "r_y3": 147.77997000000005, "coord_origin": "TOPLEFT" }, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 166.80864999999994, "r_x1": 480.58838000000003, "r_y1": 166.80864999999994, "r_x2": 480.58838000000003, "r_y2": 158.73895000000005, "r_x3": 134.765, "r_y3": 158.73895000000005, "coord_origin": "TOPLEFT" }, "text": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 177.76764000000003, "r_x1": 415.84454, "r_y1": 177.76764000000003, "r_x2": 415.84454, "r_y2": 169.69794000000002, "r_x3": 134.765, "r_y3": 169.69794000000002, "coord_origin": "TOPLEFT" }, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 6. Visualization of predicted structure and detected bounding boxes on a complex table with many rows. The OTSL model (B) captured repeating pattern of horizontally merged cells from the GT (A), unlike the HTML model (C). The HTML model also didn't complete the HTML sequence correctly and displayed a lot more of drift and overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet." }, { "label": "picture", "id": 3, "page_no": 10, "cluster": { "id": 3, "label": "picture", "bbox": { "l": 168.39285278320312, "t": 181.9665069580078, "r": 447.35137939453125, "b": 634.0056762695312, "coord_origin": "TOPLEFT" }, "confidence": 0.7612658739089966, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5049, "r_y0": 320.36386, "r_x1": 177.59613, "r_y1": 320.36386, "r_x2": 177.59613, "r_y2": 312.45032, "r_x3": 171.5049, "r_y3": 312.45032, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.05823, "r_y0": 500.56628, "r_x1": 177.14946, "r_y1": 500.56628, "r_x2": 177.14946, "r_y2": 492.65274, "r_x3": 171.05823, "r_y3": 492.65274, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 633.4168099999999, "r_x1": 374.96332, "r_y1": 633.4168099999999, "r_x2": 374.96332, "r_y2": 627.48166, "r_x3": 283.047, "r_y3": 627.48166, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 623.29291, "r_x1": 398.05978, "r_y1": 623.29291, "r_x2": 398.05978, "r_y2": 617.35776, "r_x3": 283.047, "r_y3": 617.35776, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64209, "r_y0": 471.53299, "r_x1": 437.50800000000004, "r_y1": 471.53299, "r_x2": 437.50800000000004, "r_y2": 465.59784, "r_x3": 293.64209, "r_y3": 465.59784, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 294.2947700000001, "r_x1": 239.23492, "r_y1": 294.2947700000001, "r_x2": 239.23492, "r_y2": 288.35962000000006, "r_x3": 181.89114, "r_y3": 288.35962000000006, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 300.82938, "r_x1": 251.52917, "r_y1": 300.82938, "r_x2": 251.52917, "r_y2": 294.89423, "r_x3": 181.89114, "r_y3": 294.89423, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83432, "r_y0": 194.81635000000006, "r_x1": 253.61339, "r_y1": 194.81635000000006, "r_x2": 253.61339, "r_y2": 184.75989000000004, "r_x3": 247.83432, "r_y3": 184.75989000000004, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.18976, "r_y0": 613.7412400000001, "r_x1": 381.54663, "r_y1": 613.7412400000001, "r_x2": 381.54663, "r_y2": 607.80609, "r_x3": 292.18976, "r_y3": 607.80609, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27777, "r_y0": 403.40067, "r_x1": 180.18666, "r_y1": 403.40067, "r_x2": 180.18666, "r_y2": 381.36288, "r_x3": 172.27777, "r_y3": 381.36288, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27747, "r_y0": 578.7478, "r_x1": 180.18663, "r_y1": 578.7478, "r_x2": 180.18663, "r_y2": 555.7769499999999, "r_x3": 172.27747, "r_y3": 555.7769499999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 18, "label": "text", "bbox": { "l": 171.5049, "t": 312.45032, "r": 177.59613, "b": 320.36386, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5049, "r_y0": 320.36386, "r_x1": 177.59613, "r_y1": 320.36386, "r_x2": 177.59613, "r_y2": 312.45032, "r_x3": 171.5049, "r_y3": 312.45032, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 171.05823, "t": 492.65274, "r": 177.14946, "b": 500.56628, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.05823, "r_y0": 500.56628, "r_x1": 177.14946, "r_y1": 500.56628, "r_x2": 177.14946, "r_y2": 492.65274, "r_x3": 171.05823, "r_y3": 492.65274, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 283.047, "t": 627.48166, "r": 374.96332, "b": 633.4168099999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 633.4168099999999, "r_x1": 374.96332, "r_y1": 633.4168099999999, "r_x2": 374.96332, "r_y2": 627.48166, "r_x3": 283.047, "r_y3": 627.48166, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 283.047, "t": 617.35776, "r": 398.05978, "b": 623.29291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 623.29291, "r_x1": 398.05978, "r_y1": 623.29291, "r_x2": 398.05978, "r_y2": 617.35776, "r_x3": 283.047, "r_y3": 617.35776, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 293.64209, "t": 465.59784, "r": 437.50800000000004, "b": 471.53299, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64209, "r_y0": 471.53299, "r_x1": 437.50800000000004, "r_y1": 471.53299, "r_x2": 437.50800000000004, "r_y2": 465.59784, "r_x3": 293.64209, "r_y3": 465.59784, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 181.89114, "t": 288.35962000000006, "r": 239.23492, "b": 294.2947700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 294.2947700000001, "r_x1": 239.23492, "r_y1": 294.2947700000001, "r_x2": 239.23492, "r_y2": 288.35962000000006, "r_x3": 181.89114, "r_y3": 288.35962000000006, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 181.89114, "t": 294.89423, "r": 251.52917, "b": 300.82938, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 300.82938, "r_x1": 251.52917, "r_y1": 300.82938, "r_x2": 251.52917, "r_y2": 294.89423, "r_x3": 181.89114, "r_y3": 294.89423, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 247.83432, "t": 184.75989000000004, "r": 253.61339, "b": 194.81635000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83432, "r_y0": 194.81635000000006, "r_x1": 253.61339, "r_y1": 194.81635000000006, "r_x2": 253.61339, "r_y2": 184.75989000000004, "r_x3": 247.83432, "r_y3": 184.75989000000004, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 292.18976, "t": 607.80609, "r": 381.54663, "b": 613.7412400000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.18976, "r_y0": 613.7412400000001, "r_x1": 381.54663, "r_y1": 613.7412400000001, "r_x2": 381.54663, "r_y2": 607.80609, "r_x3": 292.18976, "r_y3": 607.80609, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 172.27777, "t": 381.36288, "r": 180.18666, "b": 403.40067, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27777, "r_y0": 403.40067, "r_x1": 180.18666, "r_y1": 403.40067, "r_x2": 180.18666, "r_y2": 381.36288, "r_x3": 172.27777, "r_y3": 381.36288, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 172.27747, "t": 555.7769499999999, "r": 180.18663, "b": 578.7478, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27747, "r_y0": 578.7478, "r_x1": 180.18663, "r_y1": 578.7478, "r_x2": 180.18663, "r_y2": 555.7769499999999, "r_x3": 172.27747, "r_y3": 555.7769499999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "body": [ { "label": "caption", "id": 2, "page_no": 10, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 134.765, "t": 125.79918999999984, "r": 480.58838000000003, "b": 177.76764000000003, "coord_origin": "TOPLEFT" }, "confidence": 0.8657060861587524, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 133.72551999999996, "r_x1": 162.64424, "r_y1": 133.72551999999996, "r_x2": 162.64424, "r_y2": 125.79918999999984, "r_x3": 134.765, "r_y3": 125.79918999999984, "coord_origin": "TOPLEFT" }, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.215, "r_y0": 133.93169999999998, "r_x1": 480.58752, "r_y1": 133.93169999999998, "r_x2": 480.58752, "r_y2": 125.86200000000008, "r_x3": 165.215, "r_y3": 125.86200000000008, "coord_origin": "TOPLEFT" }, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 144.89068999999995, "r_x1": 480.58823, "r_y1": 144.89068999999995, "r_x2": 480.58823, "r_y2": 136.82097999999996, "r_x3": 134.765, "r_y3": 136.82097999999996, "coord_origin": "TOPLEFT" }, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 155.84966999999995, "r_x1": 480.5881999999999, "r_y1": 155.84966999999995, "r_x2": 480.5881999999999, "r_y2": 147.77997000000005, "r_x3": 134.765, "r_y3": 147.77997000000005, "coord_origin": "TOPLEFT" }, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 166.80864999999994, "r_x1": 480.58838000000003, "r_y1": 166.80864999999994, "r_x2": 480.58838000000003, "r_y2": 158.73895000000005, "r_x3": 134.765, "r_y3": 158.73895000000005, "coord_origin": "TOPLEFT" }, "text": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 177.76764000000003, "r_x1": 415.84454, "r_y1": 177.76764000000003, "r_x2": 415.84454, "r_y2": 169.69794000000002, "r_x3": 134.765, "r_y3": 169.69794000000002, "coord_origin": "TOPLEFT" }, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 6. Visualization of predicted structure and detected bounding boxes on a complex table with many rows. The OTSL model (B) captured repeating pattern of horizontally merged cells from the GT (A), unlike the HTML model (C). The HTML model also didn't complete the HTML sequence correctly and displayed a lot more of drift and overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet." }, { "label": "picture", "id": 3, "page_no": 10, "cluster": { "id": 3, "label": "picture", "bbox": { "l": 168.39285278320312, "t": 181.9665069580078, "r": 447.35137939453125, "b": 634.0056762695312, "coord_origin": "TOPLEFT" }, "confidence": 0.7612658739089966, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5049, "r_y0": 320.36386, "r_x1": 177.59613, "r_y1": 320.36386, "r_x2": 177.59613, "r_y2": 312.45032, "r_x3": 171.5049, "r_y3": 312.45032, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.05823, "r_y0": 500.56628, "r_x1": 177.14946, "r_y1": 500.56628, "r_x2": 177.14946, "r_y2": 492.65274, "r_x3": 171.05823, "r_y3": 492.65274, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 633.4168099999999, "r_x1": 374.96332, "r_y1": 633.4168099999999, "r_x2": 374.96332, "r_y2": 627.48166, "r_x3": 283.047, "r_y3": 627.48166, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 623.29291, "r_x1": 398.05978, "r_y1": 623.29291, "r_x2": 398.05978, "r_y2": 617.35776, "r_x3": 283.047, "r_y3": 617.35776, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64209, "r_y0": 471.53299, "r_x1": 437.50800000000004, "r_y1": 471.53299, "r_x2": 437.50800000000004, "r_y2": 465.59784, "r_x3": 293.64209, "r_y3": 465.59784, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 294.2947700000001, "r_x1": 239.23492, "r_y1": 294.2947700000001, "r_x2": 239.23492, "r_y2": 288.35962000000006, "r_x3": 181.89114, "r_y3": 288.35962000000006, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 300.82938, "r_x1": 251.52917, "r_y1": 300.82938, "r_x2": 251.52917, "r_y2": 294.89423, "r_x3": 181.89114, "r_y3": 294.89423, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83432, "r_y0": 194.81635000000006, "r_x1": 253.61339, "r_y1": 194.81635000000006, "r_x2": 253.61339, "r_y2": 184.75989000000004, "r_x3": 247.83432, "r_y3": 184.75989000000004, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.18976, "r_y0": 613.7412400000001, "r_x1": 381.54663, "r_y1": 613.7412400000001, "r_x2": 381.54663, "r_y2": 607.80609, "r_x3": 292.18976, "r_y3": 607.80609, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27777, "r_y0": 403.40067, "r_x1": 180.18666, "r_y1": 403.40067, "r_x2": 180.18666, "r_y2": 381.36288, "r_x3": 172.27777, "r_y3": 381.36288, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27747, "r_y0": 578.7478, "r_x1": 180.18663, "r_y1": 578.7478, "r_x2": 180.18663, "r_y2": 555.7769499999999, "r_x3": 172.27747, "r_y3": 555.7769499999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 18, "label": "text", "bbox": { "l": 171.5049, "t": 312.45032, "r": 177.59613, "b": 320.36386, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5049, "r_y0": 320.36386, "r_x1": 177.59613, "r_y1": 320.36386, "r_x2": 177.59613, "r_y2": 312.45032, "r_x3": 171.5049, "r_y3": 312.45032, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 171.05823, "t": 492.65274, "r": 177.14946, "b": 500.56628, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.05823, "r_y0": 500.56628, "r_x1": 177.14946, "r_y1": 500.56628, "r_x2": 177.14946, "r_y2": 492.65274, "r_x3": 171.05823, "r_y3": 492.65274, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 283.047, "t": 627.48166, "r": 374.96332, "b": 633.4168099999999, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 633.4168099999999, "r_x1": 374.96332, "r_y1": 633.4168099999999, "r_x2": 374.96332, "r_y2": 627.48166, "r_x3": 283.047, "r_y3": 627.48166, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 283.047, "t": 617.35776, "r": 398.05978, "b": 623.29291, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.047, "r_y0": 623.29291, "r_x1": 398.05978, "r_y1": 623.29291, "r_x2": 398.05978, "r_y2": 617.35776, "r_x3": 283.047, "r_y3": 617.35776, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 293.64209, "t": 465.59784, "r": 437.50800000000004, "b": 471.53299, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64209, "r_y0": 471.53299, "r_x1": 437.50800000000004, "r_y1": 471.53299, "r_x2": 437.50800000000004, "r_y2": 465.59784, "r_x3": 293.64209, "r_y3": 465.59784, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 181.89114, "t": 288.35962000000006, "r": 239.23492, "b": 294.2947700000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 294.2947700000001, "r_x1": 239.23492, "r_y1": 294.2947700000001, "r_x2": 239.23492, "r_y2": 288.35962000000006, "r_x3": 181.89114, "r_y3": 288.35962000000006, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 181.89114, "t": 294.89423, "r": 251.52917, "b": 300.82938, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89114, "r_y0": 300.82938, "r_x1": 251.52917, "r_y1": 300.82938, "r_x2": 251.52917, "r_y2": 294.89423, "r_x3": 181.89114, "r_y3": 294.89423, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 247.83432, "t": 184.75989000000004, "r": 253.61339, "b": 194.81635000000006, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83432, "r_y0": 194.81635000000006, "r_x1": 253.61339, "r_y1": 194.81635000000006, "r_x2": 253.61339, "r_y2": 184.75989000000004, "r_x3": 247.83432, "r_y3": 184.75989000000004, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 292.18976, "t": 607.80609, "r": 381.54663, "b": 613.7412400000001, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.18976, "r_y0": 613.7412400000001, "r_x1": 381.54663, "r_y1": 613.7412400000001, "r_x2": 381.54663, "r_y2": 607.80609, "r_x3": 292.18976, "r_y3": 607.80609, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 172.27777, "t": 381.36288, "r": 180.18666, "b": 403.40067, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27777, "r_y0": 403.40067, "r_x1": 180.18666, "r_y1": 403.40067, "r_x2": 180.18666, "r_y2": 381.36288, "r_x3": 172.27777, "r_y3": 381.36288, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 172.27747, "t": 555.7769499999999, "r": 180.18663, "b": 578.7478, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.27747, "r_y0": 578.7478, "r_x1": 180.18663, "r_y1": 578.7478, "r_x2": 180.18663, "r_y2": 555.7769499999999, "r_x3": 172.27747, "r_y3": 555.7769499999999, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "headers": [ { "label": "page_header", "id": 0, "page_no": 10, "cluster": { "id": 0, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9301655888557434, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 1, "page_no": 10, "cluster": { "id": 1, "label": "page_header", "bbox": { "l": 471.37561, "t": 93.77099999999996, "r": 480.5894799999999, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9007201790809631, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.37561, "r_y0": 101.84069999999997, "r_x1": 480.5894799999999, "r_y1": 101.84069999999997, "r_x2": 480.5894799999999, "r_y2": 93.77099999999996, "r_x3": 471.37561, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11" } ] } }, { "page_no": 11, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 143.97887, "r_y1": 101.84069999999997, "r_x2": 143.97887, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82053, "r_y0": 101.84069999999997, "r_x1": 178.08249, "r_y1": 101.84069999999997, "r_x2": 178.08249, "r_y2": 93.77099999999996, "r_x3": 167.82053, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37929, "r_y0": 101.84069999999997, "r_x1": 231.72049000000004, "r_y1": 101.84069999999997, "r_x2": 231.72049000000004, "r_y2": 93.77099999999996, "r_x3": 182.37929, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 128.11737000000005, "r_x1": 141.4886, "r_y1": 128.11737000000005, "r_x2": 141.4886, "r_y2": 117.54894999999988, "r_x3": 134.765, "r_y3": 117.54894999999988, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9382, "r_y0": 128.11737000000005, "r_x1": 219.25478999999999, "r_y1": 128.11737000000005, "r_x2": 219.25478999999999, "r_y2": 117.54894999999988, "r_x3": 154.9382, "r_y3": 117.54894999999988, "coord_origin": "TOPLEFT" }, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 155.66076999999996, "r_x1": 480.59476, "r_y1": 155.66076999999996, "r_x2": 480.59476, "r_y2": 146.86377000000005, "r_x3": 134.765, "r_y3": 146.86377000000005, "coord_origin": "TOPLEFT" }, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 167.61577999999997, "r_x1": 480.59476, "r_y1": 167.61577999999997, "r_x2": 480.59476, "r_y2": 158.81879000000004, "r_x3": 134.765, "r_y3": 158.81879000000004, "coord_origin": "TOPLEFT" }, "text": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "orig": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 179.57079999999996, "r_x1": 480.58978, "r_y1": 179.57079999999996, "r_x2": 480.58978, "r_y2": 170.77380000000005, "r_x3": 134.765, "r_y3": 170.77380000000005, "coord_origin": "TOPLEFT" }, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 191.52679, "r_x1": 480.59569999999997, "r_y1": 191.52679, "r_x2": 480.59569999999997, "r_y2": 182.72979999999995, "r_x3": 134.765, "r_y3": 182.72979999999995, "coord_origin": "TOPLEFT" }, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 203.48181, "r_x1": 239.5387, "r_y1": 203.48181, "r_x2": 239.5387, "r_y2": 194.68480999999997, "r_x3": 134.765, "r_y3": 194.68480999999997, "coord_origin": "TOPLEFT" }, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 216.24077999999997, "r_x1": 480.59283000000005, "r_y1": 216.24077999999997, "r_x2": 480.59283000000005, "r_y2": 207.44379000000004, "r_x3": 149.709, "r_y3": 207.44379000000004, "coord_origin": "TOPLEFT" }, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 228.19579999999996, "r_x1": 480.59365999999994, "r_y1": 228.19579999999996, "r_x2": 480.59365999999994, "r_y2": 219.39880000000005, "r_x3": 134.765, "r_y3": 219.39880000000005, "coord_origin": "TOPLEFT" }, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 240.15081999999995, "r_x1": 480.59079, "r_y1": 240.15081999999995, "r_x2": 480.59079, "r_y2": 231.35382000000004, "r_x3": 134.765, "r_y3": 231.35382000000004, "coord_origin": "TOPLEFT" }, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 252.10582999999997, "r_x1": 480.58786000000003, "r_y1": 252.10582999999997, "r_x2": 480.58786000000003, "r_y2": 243.30884000000003, "r_x3": 134.765, "r_y3": 243.30884000000003, "coord_origin": "TOPLEFT" }, "text": "OTSL representation. Additional performance benefits can be obtained with", "orig": "OTSL representation. Additional performance benefits can be obtained with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 264.06183, "r_x1": 480.59479, "r_y1": 264.06183, "r_x2": 480.59479, "r_y2": 255.26482999999996, "r_x3": 134.765, "r_y3": 255.26482999999996, "coord_origin": "TOPLEFT" }, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 276.01685, "r_x1": 480.5878000000001, "r_y1": 276.01685, "r_x2": 480.5878000000001, "r_y2": 267.21984999999995, "r_x3": 134.765, "r_y3": 267.21984999999995, "coord_origin": "TOPLEFT" }, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 287.97183, "r_x1": 480.59268, "r_y1": 287.97183, "r_x2": 480.59268, "r_y2": 279.17487000000006, "r_x3": 134.765, "r_y3": 279.17487000000006, "coord_origin": "TOPLEFT" }, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 299.92682, "r_x1": 480.58871, "r_y1": 299.92682, "r_x2": 480.58871, "r_y2": 291.12985, "r_x3": 134.765, "r_y3": 291.12985, "coord_origin": "TOPLEFT" }, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 311.88181, "r_x1": 480.59375, "r_y1": 311.88181, "r_x2": 480.59375, "r_y2": 303.08484, "r_x3": 134.765, "r_y3": 303.08484, "coord_origin": "TOPLEFT" }, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 323.83679, "r_x1": 240.92351000000002, "r_y1": 323.83679, "r_x2": 240.92351000000002, "r_y2": 315.03983, "r_x3": 134.765, "r_y3": 315.03983, "coord_origin": "TOPLEFT" }, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 336.5957900000001, "r_x1": 480.58984, "r_y1": 336.5957900000001, "r_x2": 480.58984, "r_y2": 327.79883, "r_x3": 149.709, "r_y3": 327.79883, "coord_origin": "TOPLEFT" }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 348.55179, "r_x1": 480.59473, "r_y1": 348.55179, "r_x2": 480.59473, "r_y2": 339.75482, "r_x3": 134.765, "r_y3": 339.75482, "coord_origin": "TOPLEFT" }, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 360.50677, "r_x1": 480.58664, "r_y1": 360.50677, "r_x2": 480.58664, "r_y2": 351.70981, "r_x3": 134.765, "r_y3": 351.70981, "coord_origin": "TOPLEFT" }, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 372.46176, "r_x1": 480.59479, "r_y1": 372.46176, "r_x2": 480.59479, "r_y2": 363.66479, "r_x3": 134.765, "r_y3": 363.66479, "coord_origin": "TOPLEFT" }, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 384.41675, "r_x1": 480.58971999999994, "r_y1": 384.41675, "r_x2": 480.58971999999994, "r_y2": 375.61978, "r_x3": 134.765, "r_y3": 375.61978, "coord_origin": "TOPLEFT" }, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 396.37173, "r_x1": 480.58673, "r_y1": 396.37173, "r_x2": 480.58673, "r_y2": 387.57477, "r_x3": 134.765, "r_y3": 387.57477, "coord_origin": "TOPLEFT" }, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 408.32773, "r_x1": 480.58574999999996, "r_y1": 408.32773, "r_x2": 480.58574999999996, "r_y2": 399.53076, "r_x3": 134.765, "r_y3": 399.53076, "coord_origin": "TOPLEFT" }, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 420.28271, "r_x1": 480.58675999999997, "r_y1": 420.28271, "r_x2": 480.58675999999997, "r_y2": 411.48575, "r_x3": 134.765, "r_y3": 411.48575, "coord_origin": "TOPLEFT" }, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 432.23769999999996, "r_x1": 480.59482, "r_y1": 432.23769999999996, "r_x2": 480.59482, "r_y2": 423.44073, "r_x3": 134.765, "r_y3": 423.44073, "coord_origin": "TOPLEFT" }, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 444.19269, "r_x1": 480.58777, "r_y1": 444.19269, "r_x2": 480.58777, "r_y2": 435.39572, "r_x3": 134.765, "r_y3": 435.39572, "coord_origin": "TOPLEFT" }, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 456.14767, "r_x1": 480.58968999999996, "r_y1": 456.14767, "r_x2": 480.58968999999996, "r_y2": 447.35071, "r_x3": 134.765, "r_y3": 447.35071, "coord_origin": "TOPLEFT" }, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 468.10266, "r_x1": 366.77698, "r_y1": 468.10266, "r_x2": 366.77698, "r_y2": 459.30569, "r_x3": 134.765, "r_y3": 459.30569, "coord_origin": "TOPLEFT" }, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 504.38922, "r_x1": 197.68642, "r_y1": 504.38922, "r_x2": 197.68642, "r_y2": 493.82083, "r_x3": 134.765, "r_y3": 493.82083, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 530.94962, "r_x1": 146.46127, "r_y1": 530.94962, "r_x2": 146.46127, "r_y2": 522.87985, "r_x3": 139.371, "r_y3": 522.87985, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.01955, "r_y0": 530.94962, "r_x1": 480.5920100000001, "r_y1": 530.94962, "r_x2": 480.5920100000001, "r_y2": 522.87985, "r_x3": 151.01955, "r_y3": 522.87985, "coord_origin": "TOPLEFT" }, "text": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "orig": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 541.90862, "r_x1": 480.58667, "r_y1": 541.90862, "r_x2": 480.58667, "r_y2": 533.83887, "r_x3": 151.51801, "r_y3": 533.83887, "coord_origin": "TOPLEFT" }, "text": "ument conversion as a cloud service with high throughput and responsiveness.", "orig": "ument conversion as a cloud service with high throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 552.86761, "r_x1": 176.34149, "r_y1": 552.86761, "r_x2": 176.34149, "r_y2": 544.79785, "r_x3": 151.51801, "r_y3": 544.79785, "coord_origin": "TOPLEFT" }, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.464, "r_y0": 552.66139, "r_x1": 250.67963, "r_y1": 552.66139, "r_x2": 250.67963, "r_y2": 544.73509, "r_x3": 179.464, "r_y3": 544.73509, "coord_origin": "TOPLEFT" }, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.804, "r_y0": 552.86761, "r_x1": 281.9567, "r_y1": 552.86761, "r_x2": 281.9567, "r_y2": 544.79785, "r_x3": 253.804, "r_y3": 544.79785, "coord_origin": "TOPLEFT" }, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.078, "r_y0": 552.91245, "r_x1": 478.03403000000003, "r_y1": 552.91245, "r_x2": 478.03403000000003, "r_y2": 545.44344, "r_x3": 285.078, "r_y3": 545.44344, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0319799999999, "r_y0": 552.86761, "r_x1": 480.59099999999995, "r_y1": 552.86761, "r_x2": 480.59099999999995, "r_y2": 544.79785, "r_x3": 478.0319799999999, "r_y3": 544.79785, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 563.87144, "r_x1": 344.474, "r_y1": 563.87144, "r_x2": 344.474, "r_y2": 556.4024400000001, "r_x3": 151.51797, "r_y3": 556.4024400000001, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37097, "r_y0": 575.58861, "r_x1": 145.94186, "r_y1": 575.58861, "r_x2": 145.94186, "r_y2": 567.51884, "r_x3": 139.37097, "r_y3": 567.51884, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.16624, "r_y0": 575.58861, "r_x1": 480.58636, "r_y1": 575.58861, "r_x2": 480.58636, "r_y2": 567.51884, "r_x3": 150.16624, "r_y3": 567.51884, "coord_origin": "TOPLEFT" }, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 586.5476100000001, "r_x1": 480.59012, "r_y1": 586.5476100000001, "r_x2": 480.59012, "r_y2": 578.47784, "r_x3": 151.51797, "r_y3": 578.47784, "coord_origin": "TOPLEFT" }, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 597.50661, "r_x1": 480.5920100000001, "r_y1": 597.50661, "r_x2": 480.5920100000001, "r_y2": 589.43684, "r_x3": 151.51797, "r_y3": 589.43684, "coord_origin": "TOPLEFT" }, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 608.46561, "r_x1": 364.17856, "r_y1": 608.46561, "r_x2": 364.17856, "r_y2": 600.39584, "r_x3": 151.51797, "r_y3": 600.39584, "coord_origin": "TOPLEFT" }, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37097, "r_y0": 620.22861, "r_x1": 146.4379, "r_y1": 620.22861, "r_x2": 146.4379, "r_y2": 612.1588399999999, "r_x3": 139.37097, "r_y3": 612.1588399999999, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.98117, "r_y0": 620.22861, "r_x1": 480.58731000000006, "r_y1": 620.22861, "r_x2": 480.58731000000006, "r_y2": 612.1588399999999, "r_x3": 150.98117, "r_y3": 612.1588399999999, "coord_origin": "TOPLEFT" }, "text": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 631.18761, "r_x1": 400.22525, "r_y1": 631.18761, "r_x2": 400.22525, "r_y2": 623.11784, "r_x3": 151.51797, "r_y3": 623.11784, "coord_origin": "TOPLEFT" }, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37097, "r_y0": 642.95061, "r_x1": 146.52443, "r_y1": 642.95061, "r_x2": 146.52443, "r_y2": 634.88084, "r_x3": 139.37097, "r_y3": 634.88084, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.12335, "r_y0": 642.95061, "r_x1": 480.58826, "r_y1": 642.95061, "r_x2": 480.58826, "r_y2": 634.88084, "r_x3": 151.12335, "r_y3": 634.88084, "coord_origin": "TOPLEFT" }, "text": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "orig": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 653.9096099999999, "r_x1": 480.58752, "r_y1": 653.9096099999999, "r_x2": 480.58752, "r_y2": 645.83984, "r_x3": 151.51797, "r_y3": 645.83984, "coord_origin": "TOPLEFT" }, "text": "table recognition. In: 2019 International Conference on Document Analysis and", "orig": "table recognition. In: 2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 664.86761, "r_x1": 350.11115, "r_y1": 664.86761, "r_x2": 350.11115, "r_y2": 656.79785, "r_x3": 151.51797, "r_y3": 656.79785, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 10, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 143.97887, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8610832691192627, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 143.97887, "r_y1": 101.84069999999997, "r_x2": 143.97887, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "page_header", "bbox": { "l": 167.82053, "t": 93.77099999999996, "r": 231.72049000000004, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8927664756774902, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82053, "r_y0": 101.84069999999997, "r_x1": 178.08249, "r_y1": 101.84069999999997, "r_x2": 178.08249, "r_y2": 93.77099999999996, "r_x3": 167.82053, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37929, "r_y0": 101.84069999999997, "r_x1": 231.72049000000004, "r_y1": 101.84069999999997, "r_x2": 231.72049000000004, "r_y2": 93.77099999999996, "r_x3": 182.37929, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "section_header", "bbox": { "l": 134.765, "t": 117.54894999999988, "r": 219.25478999999999, "b": 128.11737000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.915635347366333, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 128.11737000000005, "r_x1": 141.4886, "r_y1": 128.11737000000005, "r_x2": 141.4886, "r_y2": 117.54894999999988, "r_x3": 134.765, "r_y3": 117.54894999999988, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9382, "r_y0": 128.11737000000005, "r_x1": 219.25478999999999, "r_y1": 128.11737000000005, "r_x2": 219.25478999999999, "r_y2": 117.54894999999988, "r_x3": 154.9382, "r_y3": 117.54894999999988, "coord_origin": "TOPLEFT" }, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.765, "t": 146.86377000000005, "r": 480.59569999999997, "b": 203.48181, "coord_origin": "TOPLEFT" }, "confidence": 0.9806171655654907, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 155.66076999999996, "r_x1": 480.59476, "r_y1": 155.66076999999996, "r_x2": 480.59476, "r_y2": 146.86377000000005, "r_x3": 134.765, "r_y3": 146.86377000000005, "coord_origin": "TOPLEFT" }, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 167.61577999999997, "r_x1": 480.59476, "r_y1": 167.61577999999997, "r_x2": 480.59476, "r_y2": 158.81879000000004, "r_x3": 134.765, "r_y3": 158.81879000000004, "coord_origin": "TOPLEFT" }, "text": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "orig": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 179.57079999999996, "r_x1": 480.58978, "r_y1": 179.57079999999996, "r_x2": 480.58978, "r_y2": 170.77380000000005, "r_x3": 134.765, "r_y3": 170.77380000000005, "coord_origin": "TOPLEFT" }, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 191.52679, "r_x1": 480.59569999999997, "r_y1": 191.52679, "r_x2": 480.59569999999997, "r_y2": 182.72979999999995, "r_x3": 134.765, "r_y3": 182.72979999999995, "coord_origin": "TOPLEFT" }, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 203.48181, "r_x1": 239.5387, "r_y1": 203.48181, "r_x2": 239.5387, "r_y2": 194.68480999999997, "r_x3": 134.765, "r_y3": 194.68480999999997, "coord_origin": "TOPLEFT" }, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.765, "t": 207.44379000000004, "r": 480.59479, "b": 323.83679, "coord_origin": "TOPLEFT" }, "confidence": 0.9873476028442383, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 216.24077999999997, "r_x1": 480.59283000000005, "r_y1": 216.24077999999997, "r_x2": 480.59283000000005, "r_y2": 207.44379000000004, "r_x3": 149.709, "r_y3": 207.44379000000004, "coord_origin": "TOPLEFT" }, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 228.19579999999996, "r_x1": 480.59365999999994, "r_y1": 228.19579999999996, "r_x2": 480.59365999999994, "r_y2": 219.39880000000005, "r_x3": 134.765, "r_y3": 219.39880000000005, "coord_origin": "TOPLEFT" }, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 240.15081999999995, "r_x1": 480.59079, "r_y1": 240.15081999999995, "r_x2": 480.59079, "r_y2": 231.35382000000004, "r_x3": 134.765, "r_y3": 231.35382000000004, "coord_origin": "TOPLEFT" }, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 252.10582999999997, "r_x1": 480.58786000000003, "r_y1": 252.10582999999997, "r_x2": 480.58786000000003, "r_y2": 243.30884000000003, "r_x3": 134.765, "r_y3": 243.30884000000003, "coord_origin": "TOPLEFT" }, "text": "OTSL representation. Additional performance benefits can be obtained with", "orig": "OTSL representation. Additional performance benefits can be obtained with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 264.06183, "r_x1": 480.59479, "r_y1": 264.06183, "r_x2": 480.59479, "r_y2": 255.26482999999996, "r_x3": 134.765, "r_y3": 255.26482999999996, "coord_origin": "TOPLEFT" }, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 276.01685, "r_x1": 480.5878000000001, "r_y1": 276.01685, "r_x2": 480.5878000000001, "r_y2": 267.21984999999995, "r_x3": 134.765, "r_y3": 267.21984999999995, "coord_origin": "TOPLEFT" }, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 287.97183, "r_x1": 480.59268, "r_y1": 287.97183, "r_x2": 480.59268, "r_y2": 279.17487000000006, "r_x3": 134.765, "r_y3": 279.17487000000006, "coord_origin": "TOPLEFT" }, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 299.92682, "r_x1": 480.58871, "r_y1": 299.92682, "r_x2": 480.58871, "r_y2": 291.12985, "r_x3": 134.765, "r_y3": 291.12985, "coord_origin": "TOPLEFT" }, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 311.88181, "r_x1": 480.59375, "r_y1": 311.88181, "r_x2": 480.59375, "r_y2": 303.08484, "r_x3": 134.765, "r_y3": 303.08484, "coord_origin": "TOPLEFT" }, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 323.83679, "r_x1": 240.92351000000002, "r_y1": 323.83679, "r_x2": 240.92351000000002, "r_y2": 315.03983, "r_x3": 134.765, "r_y3": 315.03983, "coord_origin": "TOPLEFT" }, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 327.79883, "r": 480.59482, "b": 468.10266, "coord_origin": "TOPLEFT" }, "confidence": 0.9868747591972351, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 336.5957900000001, "r_x1": 480.58984, "r_y1": 336.5957900000001, "r_x2": 480.58984, "r_y2": 327.79883, "r_x3": 149.709, "r_y3": 327.79883, "coord_origin": "TOPLEFT" }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 348.55179, "r_x1": 480.59473, "r_y1": 348.55179, "r_x2": 480.59473, "r_y2": 339.75482, "r_x3": 134.765, "r_y3": 339.75482, "coord_origin": "TOPLEFT" }, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 360.50677, "r_x1": 480.58664, "r_y1": 360.50677, "r_x2": 480.58664, "r_y2": 351.70981, "r_x3": 134.765, "r_y3": 351.70981, "coord_origin": "TOPLEFT" }, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 372.46176, "r_x1": 480.59479, "r_y1": 372.46176, "r_x2": 480.59479, "r_y2": 363.66479, "r_x3": 134.765, "r_y3": 363.66479, "coord_origin": "TOPLEFT" }, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 384.41675, "r_x1": 480.58971999999994, "r_y1": 384.41675, "r_x2": 480.58971999999994, "r_y2": 375.61978, "r_x3": 134.765, "r_y3": 375.61978, "coord_origin": "TOPLEFT" }, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 396.37173, "r_x1": 480.58673, "r_y1": 396.37173, "r_x2": 480.58673, "r_y2": 387.57477, "r_x3": 134.765, "r_y3": 387.57477, "coord_origin": "TOPLEFT" }, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 408.32773, "r_x1": 480.58574999999996, "r_y1": 408.32773, "r_x2": 480.58574999999996, "r_y2": 399.53076, "r_x3": 134.765, "r_y3": 399.53076, "coord_origin": "TOPLEFT" }, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 420.28271, "r_x1": 480.58675999999997, "r_y1": 420.28271, "r_x2": 480.58675999999997, "r_y2": 411.48575, "r_x3": 134.765, "r_y3": 411.48575, "coord_origin": "TOPLEFT" }, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 432.23769999999996, "r_x1": 480.59482, "r_y1": 432.23769999999996, "r_x2": 480.59482, "r_y2": 423.44073, "r_x3": 134.765, "r_y3": 423.44073, "coord_origin": "TOPLEFT" }, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 444.19269, "r_x1": 480.58777, "r_y1": 444.19269, "r_x2": 480.58777, "r_y2": 435.39572, "r_x3": 134.765, "r_y3": 435.39572, "coord_origin": "TOPLEFT" }, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 456.14767, "r_x1": 480.58968999999996, "r_y1": 456.14767, "r_x2": 480.58968999999996, "r_y2": 447.35071, "r_x3": 134.765, "r_y3": 447.35071, "coord_origin": "TOPLEFT" }, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 468.10266, "r_x1": 366.77698, "r_y1": 468.10266, "r_x2": 366.77698, "r_y2": 459.30569, "r_x3": 134.765, "r_y3": 459.30569, "coord_origin": "TOPLEFT" }, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "section_header", "bbox": { "l": 134.765, "t": 493.82083, "r": 197.68642, "b": 504.38922, "coord_origin": "TOPLEFT" }, "confidence": 0.9403266310691833, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 504.38922, "r_x1": 197.68642, "r_y1": 504.38922, "r_x2": 197.68642, "r_y2": 493.82083, "r_x3": 134.765, "r_y3": 493.82083, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 139.371, "t": 522.87985, "r": 480.5920100000001, "b": 563.87144, "coord_origin": "TOPLEFT" }, "confidence": 0.9698606729507446, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 530.94962, "r_x1": 146.46127, "r_y1": 530.94962, "r_x2": 146.46127, "r_y2": 522.87985, "r_x3": 139.371, "r_y3": 522.87985, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.01955, "r_y0": 530.94962, "r_x1": 480.5920100000001, "r_y1": 530.94962, "r_x2": 480.5920100000001, "r_y2": 522.87985, "r_x3": 151.01955, "r_y3": 522.87985, "coord_origin": "TOPLEFT" }, "text": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "orig": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 541.90862, "r_x1": 480.58667, "r_y1": 541.90862, "r_x2": 480.58667, "r_y2": 533.83887, "r_x3": 151.51801, "r_y3": 533.83887, "coord_origin": "TOPLEFT" }, "text": "ument conversion as a cloud service with high throughput and responsiveness.", "orig": "ument conversion as a cloud service with high throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 552.86761, "r_x1": 176.34149, "r_y1": 552.86761, "r_x2": 176.34149, "r_y2": 544.79785, "r_x3": 151.51801, "r_y3": 544.79785, "coord_origin": "TOPLEFT" }, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.464, "r_y0": 552.66139, "r_x1": 250.67963, "r_y1": 552.66139, "r_x2": 250.67963, "r_y2": 544.73509, "r_x3": 179.464, "r_y3": 544.73509, "coord_origin": "TOPLEFT" }, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.804, "r_y0": 552.86761, "r_x1": 281.9567, "r_y1": 552.86761, "r_x2": 281.9567, "r_y2": 544.79785, "r_x3": 253.804, "r_y3": 544.79785, "coord_origin": "TOPLEFT" }, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.078, "r_y0": 552.91245, "r_x1": 478.03403000000003, "r_y1": 552.91245, "r_x2": 478.03403000000003, "r_y2": 545.44344, "r_x3": 285.078, "r_y3": 545.44344, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0319799999999, "r_y0": 552.86761, "r_x1": 480.59099999999995, "r_y1": 552.86761, "r_x2": 480.59099999999995, "r_y2": 544.79785, "r_x3": 478.0319799999999, "r_y3": 544.79785, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 563.87144, "r_x1": 344.474, "r_y1": 563.87144, "r_x2": 344.474, "r_y2": 556.4024400000001, "r_x3": 151.51797, "r_y3": 556.4024400000001, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 139.37097, "t": 567.51884, "r": 480.5920100000001, "b": 608.46561, "coord_origin": "TOPLEFT" }, "confidence": 0.9730570316314697, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37097, "r_y0": 575.58861, "r_x1": 145.94186, "r_y1": 575.58861, "r_x2": 145.94186, "r_y2": 567.51884, "r_x3": 139.37097, "r_y3": 567.51884, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.16624, "r_y0": 575.58861, "r_x1": 480.58636, "r_y1": 575.58861, "r_x2": 480.58636, "r_y2": 567.51884, "r_x3": 150.16624, "r_y3": 567.51884, "coord_origin": "TOPLEFT" }, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 586.5476100000001, "r_x1": 480.59012, "r_y1": 586.5476100000001, "r_x2": 480.59012, "r_y2": 578.47784, "r_x3": 151.51797, "r_y3": 578.47784, "coord_origin": "TOPLEFT" }, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 597.50661, "r_x1": 480.5920100000001, "r_y1": 597.50661, "r_x2": 480.5920100000001, "r_y2": 589.43684, "r_x3": 151.51797, "r_y3": 589.43684, "coord_origin": "TOPLEFT" }, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 608.46561, "r_x1": 364.17856, "r_y1": 608.46561, "r_x2": 364.17856, "r_y2": 600.39584, "r_x3": 151.51797, "r_y3": 600.39584, "coord_origin": "TOPLEFT" }, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 139.37097, "t": 612.1588399999999, "r": 480.58731000000006, "b": 631.18761, "coord_origin": "TOPLEFT" }, "confidence": 0.9617196321487427, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37097, "r_y0": 620.22861, "r_x1": 146.4379, "r_y1": 620.22861, "r_x2": 146.4379, "r_y2": 612.1588399999999, "r_x3": 139.37097, "r_y3": 612.1588399999999, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.98117, "r_y0": 620.22861, "r_x1": 480.58731000000006, "r_y1": 620.22861, "r_x2": 480.58731000000006, "r_y2": 612.1588399999999, "r_x3": 150.98117, "r_y3": 612.1588399999999, "coord_origin": "TOPLEFT" }, "text": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 631.18761, "r_x1": 400.22525, "r_y1": 631.18761, "r_x2": 400.22525, "r_y2": 623.11784, "r_x3": 151.51797, "r_y3": 623.11784, "coord_origin": "TOPLEFT" }, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 139.37097, "t": 634.88084, "r": 480.58826, "b": 664.86761, "coord_origin": "TOPLEFT" }, "confidence": 0.9754673838615417, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37097, "r_y0": 642.95061, "r_x1": 146.52443, "r_y1": 642.95061, "r_x2": 146.52443, "r_y2": 634.88084, "r_x3": 139.37097, "r_y3": 634.88084, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.12335, "r_y0": 642.95061, "r_x1": 480.58826, "r_y1": 642.95061, "r_x2": 480.58826, "r_y2": 634.88084, "r_x3": 151.12335, "r_y3": 634.88084, "coord_origin": "TOPLEFT" }, "text": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "orig": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 653.9096099999999, "r_x1": 480.58752, "r_y1": 653.9096099999999, "r_x2": 480.58752, "r_y2": 645.83984, "r_x3": 151.51797, "r_y3": 645.83984, "coord_origin": "TOPLEFT" }, "text": "table recognition. In: 2019 International Conference on Document Analysis and", "orig": "table recognition. In: 2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 664.86761, "r_x1": 350.11115, "r_y1": 664.86761, "r_x2": 350.11115, "r_y2": 656.79785, "r_x3": 151.51797, "r_y3": 656.79785, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 10, "page_no": 11, "cluster": { "id": 10, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 143.97887, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8610832691192627, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 143.97887, "r_y1": 101.84069999999997, "r_x2": 143.97887, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12" }, { "label": "page_header", "id": 9, "page_no": 11, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 167.82053, "t": 93.77099999999996, "r": 231.72049000000004, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8927664756774902, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82053, "r_y0": 101.84069999999997, "r_x1": 178.08249, "r_y1": 101.84069999999997, "r_x2": 178.08249, "r_y2": 93.77099999999996, "r_x3": 167.82053, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37929, "r_y0": 101.84069999999997, "r_x1": 231.72049000000004, "r_y1": 101.84069999999997, "r_x2": 231.72049000000004, "r_y2": 93.77099999999996, "r_x3": 182.37929, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "section_header", "id": 8, "page_no": 11, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 134.765, "t": 117.54894999999988, "r": 219.25478999999999, "b": 128.11737000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.915635347366333, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 128.11737000000005, "r_x1": 141.4886, "r_y1": 128.11737000000005, "r_x2": 141.4886, "r_y2": 117.54894999999988, "r_x3": 134.765, "r_y3": 117.54894999999988, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9382, "r_y0": 128.11737000000005, "r_x1": 219.25478999999999, "r_y1": 128.11737000000005, "r_x2": 219.25478999999999, "r_y2": 117.54894999999988, "r_x3": 154.9382, "r_y3": 117.54894999999988, "coord_origin": "TOPLEFT" }, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6 Conclusion" }, { "label": "text", "id": 2, "page_no": 11, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.765, "t": 146.86377000000005, "r": 480.59569999999997, "b": 203.48181, "coord_origin": "TOPLEFT" }, "confidence": 0.9806171655654907, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 155.66076999999996, "r_x1": 480.59476, "r_y1": 155.66076999999996, "r_x2": 480.59476, "r_y2": 146.86377000000005, "r_x3": 134.765, "r_y3": 146.86377000000005, "coord_origin": "TOPLEFT" }, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 167.61577999999997, "r_x1": 480.59476, "r_y1": 167.61577999999997, "r_x2": 480.59476, "r_y2": 158.81879000000004, "r_x3": 134.765, "r_y3": 158.81879000000004, "coord_origin": "TOPLEFT" }, "text": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "orig": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 179.57079999999996, "r_x1": 480.58978, "r_y1": 179.57079999999996, "r_x2": 480.58978, "r_y2": 170.77380000000005, "r_x3": 134.765, "r_y3": 170.77380000000005, "coord_origin": "TOPLEFT" }, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 191.52679, "r_x1": 480.59569999999997, "r_y1": 191.52679, "r_x2": 480.59569999999997, "r_y2": 182.72979999999995, "r_x3": 134.765, "r_y3": 182.72979999999995, "coord_origin": "TOPLEFT" }, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 203.48181, "r_x1": 239.5387, "r_y1": 203.48181, "r_x2": 239.5387, "r_y2": 194.68480999999997, "r_x3": 134.765, "r_y3": 194.68480999999997, "coord_origin": "TOPLEFT" }, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We demonstrated that representing tables in HTML for the task of table structure recognition with Im2Seq models is ill-suited and has serious limitations. Furthermore, we presented in this paper an Optimized Table Structure Language (OTSL) which, when compared to commonly used general purpose languages, has several key benefits." }, { "label": "text", "id": 0, "page_no": 11, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.765, "t": 207.44379000000004, "r": 480.59479, "b": 323.83679, "coord_origin": "TOPLEFT" }, "confidence": 0.9873476028442383, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 216.24077999999997, "r_x1": 480.59283000000005, "r_y1": 216.24077999999997, "r_x2": 480.59283000000005, "r_y2": 207.44379000000004, "r_x3": 149.709, "r_y3": 207.44379000000004, "coord_origin": "TOPLEFT" }, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 228.19579999999996, "r_x1": 480.59365999999994, "r_y1": 228.19579999999996, "r_x2": 480.59365999999994, "r_y2": 219.39880000000005, "r_x3": 134.765, "r_y3": 219.39880000000005, "coord_origin": "TOPLEFT" }, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 240.15081999999995, "r_x1": 480.59079, "r_y1": 240.15081999999995, "r_x2": 480.59079, "r_y2": 231.35382000000004, "r_x3": 134.765, "r_y3": 231.35382000000004, "coord_origin": "TOPLEFT" }, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 252.10582999999997, "r_x1": 480.58786000000003, "r_y1": 252.10582999999997, "r_x2": 480.58786000000003, "r_y2": 243.30884000000003, "r_x3": 134.765, "r_y3": 243.30884000000003, "coord_origin": "TOPLEFT" }, "text": "OTSL representation. Additional performance benefits can be obtained with", "orig": "OTSL representation. Additional performance benefits can be obtained with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 264.06183, "r_x1": 480.59479, "r_y1": 264.06183, "r_x2": 480.59479, "r_y2": 255.26482999999996, "r_x3": 134.765, "r_y3": 255.26482999999996, "coord_origin": "TOPLEFT" }, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 276.01685, "r_x1": 480.5878000000001, "r_y1": 276.01685, "r_x2": 480.5878000000001, "r_y2": 267.21984999999995, "r_x3": 134.765, "r_y3": 267.21984999999995, "coord_origin": "TOPLEFT" }, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 287.97183, "r_x1": 480.59268, "r_y1": 287.97183, "r_x2": 480.59268, "r_y2": 279.17487000000006, "r_x3": 134.765, "r_y3": 279.17487000000006, "coord_origin": "TOPLEFT" }, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 299.92682, "r_x1": 480.58871, "r_y1": 299.92682, "r_x2": 480.58871, "r_y2": 291.12985, "r_x3": 134.765, "r_y3": 291.12985, "coord_origin": "TOPLEFT" }, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 311.88181, "r_x1": 480.59375, "r_y1": 311.88181, "r_x2": 480.59375, "r_y2": 303.08484, "r_x3": 134.765, "r_y3": 303.08484, "coord_origin": "TOPLEFT" }, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 323.83679, "r_x1": 240.92351000000002, "r_y1": 323.83679, "r_x2": 240.92351000000002, "r_y2": 315.03983, "r_x3": 134.765, "r_y3": 315.03983, "coord_origin": "TOPLEFT" }, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "First and foremost, given the same network configuration, inference time for a table-structure prediction is about 2 times faster compared to the conventional HTML approach. This is primarily owed to the shorter sequence length of the OTSL representation. Additional performance benefits can be obtained with HPO (hyper parameter optimization). As we demonstrate in our experiments, models trained on OTSL can be significantly smaller, e.g. by reducing the number of encoder and decoder layers, while preserving comparatively good prediction quality. This can further improve inference performance, yielding 5-6 times faster inference speed in OTSL with prediction quality comparable to models trained on HTML (see Table 1)." }, { "label": "text", "id": 1, "page_no": 11, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 327.79883, "r": 480.59482, "b": 468.10266, "coord_origin": "TOPLEFT" }, "confidence": 0.9868747591972351, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 336.5957900000001, "r_x1": 480.58984, "r_y1": 336.5957900000001, "r_x2": 480.58984, "r_y2": 327.79883, "r_x3": 149.709, "r_y3": 327.79883, "coord_origin": "TOPLEFT" }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 348.55179, "r_x1": 480.59473, "r_y1": 348.55179, "r_x2": 480.59473, "r_y2": 339.75482, "r_x3": 134.765, "r_y3": 339.75482, "coord_origin": "TOPLEFT" }, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 360.50677, "r_x1": 480.58664, "r_y1": 360.50677, "r_x2": 480.58664, "r_y2": 351.70981, "r_x3": 134.765, "r_y3": 351.70981, "coord_origin": "TOPLEFT" }, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 372.46176, "r_x1": 480.59479, "r_y1": 372.46176, "r_x2": 480.59479, "r_y2": 363.66479, "r_x3": 134.765, "r_y3": 363.66479, "coord_origin": "TOPLEFT" }, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 384.41675, "r_x1": 480.58971999999994, "r_y1": 384.41675, "r_x2": 480.58971999999994, "r_y2": 375.61978, "r_x3": 134.765, "r_y3": 375.61978, "coord_origin": "TOPLEFT" }, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 396.37173, "r_x1": 480.58673, "r_y1": 396.37173, "r_x2": 480.58673, "r_y2": 387.57477, "r_x3": 134.765, "r_y3": 387.57477, "coord_origin": "TOPLEFT" }, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 408.32773, "r_x1": 480.58574999999996, "r_y1": 408.32773, "r_x2": 480.58574999999996, "r_y2": 399.53076, "r_x3": 134.765, "r_y3": 399.53076, "coord_origin": "TOPLEFT" }, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 420.28271, "r_x1": 480.58675999999997, "r_y1": 420.28271, "r_x2": 480.58675999999997, "r_y2": 411.48575, "r_x3": 134.765, "r_y3": 411.48575, "coord_origin": "TOPLEFT" }, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 432.23769999999996, "r_x1": 480.59482, "r_y1": 432.23769999999996, "r_x2": 480.59482, "r_y2": 423.44073, "r_x3": 134.765, "r_y3": 423.44073, "coord_origin": "TOPLEFT" }, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 444.19269, "r_x1": 480.58777, "r_y1": 444.19269, "r_x2": 480.58777, "r_y2": 435.39572, "r_x3": 134.765, "r_y3": 435.39572, "coord_origin": "TOPLEFT" }, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 456.14767, "r_x1": 480.58968999999996, "r_y1": 456.14767, "r_x2": 480.58968999999996, "r_y2": 447.35071, "r_x3": 134.765, "r_y3": 447.35071, "coord_origin": "TOPLEFT" }, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 468.10266, "r_x1": 366.77698, "r_y1": 468.10266, "r_x2": 366.77698, "r_y2": 459.30569, "r_x3": 134.765, "r_y3": 459.30569, "coord_origin": "TOPLEFT" }, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vocabulary size. This allows autoregressive models to perform better in the TED metric, but especially with regards to prediction accuracy of the table-cell bounding boxes (see Table 2). As shown in Figure 5, we observe that the OTSL drastically reduces the drift for table cell bounding boxes at high row count and in sparse tables. This leads to more accurate predictions and a significant reduction in post-processing complexity, which is an undesired necessity in HTML-based Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few, simple and always backwards looking. Each new token can be validated only by analyzing the sequence of previous tokens, without requiring the entire sequence to detect mistakes. This in return allows to perform structural error detection and correction on-the-fly during sequence generation." }, { "label": "section_header", "id": 7, "page_no": 11, "cluster": { "id": 7, "label": "section_header", "bbox": { "l": 134.765, "t": 493.82083, "r": 197.68642, "b": 504.38922, "coord_origin": "TOPLEFT" }, "confidence": 0.9403266310691833, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 504.38922, "r_x1": 197.68642, "r_y1": 504.38922, "r_x2": 197.68642, "r_y2": 493.82083, "r_x3": 134.765, "r_y3": 493.82083, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "References" }, { "label": "list_item", "id": 5, "page_no": 11, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.371, "t": 522.87985, "r": 480.5920100000001, "b": 563.87144, "coord_origin": "TOPLEFT" }, "confidence": 0.9698606729507446, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 530.94962, "r_x1": 146.46127, "r_y1": 530.94962, "r_x2": 146.46127, "r_y2": 522.87985, "r_x3": 139.371, "r_y3": 522.87985, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.01955, "r_y0": 530.94962, "r_x1": 480.5920100000001, "r_y1": 530.94962, "r_x2": 480.5920100000001, "r_y2": 522.87985, "r_x3": 151.01955, "r_y3": 522.87985, "coord_origin": "TOPLEFT" }, "text": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "orig": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 541.90862, "r_x1": 480.58667, "r_y1": 541.90862, "r_x2": 480.58667, "r_y2": 533.83887, "r_x3": 151.51801, "r_y3": 533.83887, "coord_origin": "TOPLEFT" }, "text": "ument conversion as a cloud service with high throughput and responsiveness.", "orig": "ument conversion as a cloud service with high throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 552.86761, "r_x1": 176.34149, "r_y1": 552.86761, "r_x2": 176.34149, "r_y2": 544.79785, "r_x3": 151.51801, "r_y3": 544.79785, "coord_origin": "TOPLEFT" }, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.464, "r_y0": 552.66139, "r_x1": 250.67963, "r_y1": 552.66139, "r_x2": 250.67963, "r_y2": 544.73509, "r_x3": 179.464, "r_y3": 544.73509, "coord_origin": "TOPLEFT" }, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.804, "r_y0": 552.86761, "r_x1": 281.9567, "r_y1": 552.86761, "r_x2": 281.9567, "r_y2": 544.79785, "r_x3": 253.804, "r_y3": 544.79785, "coord_origin": "TOPLEFT" }, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.078, "r_y0": 552.91245, "r_x1": 478.03403000000003, "r_y1": 552.91245, "r_x2": 478.03403000000003, "r_y2": 545.44344, "r_x3": 285.078, "r_y3": 545.44344, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0319799999999, "r_y0": 552.86761, "r_x1": 480.59099999999995, "r_y1": 552.86761, "r_x2": 480.59099999999995, "r_y2": 544.79785, "r_x3": 478.0319799999999, "r_y3": 544.79785, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 563.87144, "r_x1": 344.474, "r_y1": 563.87144, "r_x2": 344.474, "r_y2": 556.4024400000001, "r_x3": 151.51797, "r_y3": 556.4024400000001, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering document conversion as a cloud service with high throughput and responsiveness. CoRR abs/2206.00785 (2022). https://doi.org/10.48550/arXiv.2206.00785 , https://doi.org/10.48550/arXiv.2206.00785" }, { "label": "list_item", "id": 4, "page_no": 11, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.37097, "t": 567.51884, "r": 480.5920100000001, "b": 608.46561, "coord_origin": "TOPLEFT" }, "confidence": 0.9730570316314697, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37097, "r_y0": 575.58861, "r_x1": 145.94186, "r_y1": 575.58861, "r_x2": 145.94186, "r_y2": 567.51884, "r_x3": 139.37097, "r_y3": 567.51884, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.16624, "r_y0": 575.58861, "r_x1": 480.58636, "r_y1": 575.58861, "r_x2": 480.58636, "r_y2": 567.51884, "r_x3": 150.16624, "r_y3": 567.51884, "coord_origin": "TOPLEFT" }, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 586.5476100000001, "r_x1": 480.59012, "r_y1": 586.5476100000001, "r_x2": 480.59012, "r_y2": 578.47784, "r_x3": 151.51797, "r_y3": 578.47784, "coord_origin": "TOPLEFT" }, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 597.50661, "r_x1": 480.5920100000001, "r_y1": 597.50661, "r_x2": 480.5920100000001, "r_y2": 589.43684, "r_x3": 151.51797, "r_y3": 589.43684, "coord_origin": "TOPLEFT" }, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 608.46561, "r_x1": 364.17856, "r_y1": 608.46561, "r_x2": 364.17856, "r_y2": 600.39584, "r_x3": 151.51797, "r_y3": 600.39584, "coord_origin": "TOPLEFT" }, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition in the wild using transformer and identity matrix-based augmentation. In: Porwal, U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545561. Springer International Publishing, Cham (2022)" }, { "label": "list_item", "id": 6, "page_no": 11, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 139.37097, "t": 612.1588399999999, "r": 480.58731000000006, "b": 631.18761, "coord_origin": "TOPLEFT" }, "confidence": 0.9617196321487427, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37097, "r_y0": 620.22861, "r_x1": 146.4379, "r_y1": 620.22861, "r_x2": 146.4379, "r_y2": 612.1588399999999, "r_x3": 139.37097, "r_y3": 612.1588399999999, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.98117, "r_y0": 620.22861, "r_x1": 480.58731000000006, "r_y1": 620.22861, "r_x2": 480.58731000000006, "r_y2": 612.1588399999999, "r_x3": 150.98117, "r_y3": 612.1588399999999, "coord_origin": "TOPLEFT" }, "text": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 631.18761, "r_x1": 400.22525, "r_y1": 631.18761, "r_x2": 400.22525, "r_y2": 623.11784, "r_x3": 151.51797, "r_y3": 623.11784, "coord_origin": "TOPLEFT" }, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table structure recognition. arXiv preprint arXiv:1908.04729 (2019)" }, { "label": "list_item", "id": 3, "page_no": 11, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 139.37097, "t": 634.88084, "r": 480.58826, "b": 664.86761, "coord_origin": "TOPLEFT" }, "confidence": 0.9754673838615417, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37097, "r_y0": 642.95061, "r_x1": 146.52443, "r_y1": 642.95061, "r_x2": 146.52443, "r_y2": 634.88084, "r_x3": 139.37097, "r_y3": 634.88084, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.12335, "r_y0": 642.95061, "r_x1": 480.58826, "r_y1": 642.95061, "r_x2": 480.58826, "r_y2": 634.88084, "r_x3": 151.12335, "r_y3": 634.88084, "coord_origin": "TOPLEFT" }, "text": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "orig": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 653.9096099999999, "r_x1": 480.58752, "r_y1": 653.9096099999999, "r_x2": 480.58752, "r_y2": 645.83984, "r_x3": 151.51797, "r_y3": 645.83984, "coord_origin": "TOPLEFT" }, "text": "table recognition. In: 2019 International Conference on Document Analysis and", "orig": "table recognition. In: 2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 664.86761, "r_x1": 350.11115, "r_y1": 664.86761, "r_x2": 350.11115, "r_y2": 656.79785, "r_x3": 151.51797, "r_y3": 656.79785, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific table recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 894-901. IEEE (2019)" } ], "body": [ { "label": "section_header", "id": 8, "page_no": 11, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 134.765, "t": 117.54894999999988, "r": 219.25478999999999, "b": 128.11737000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.915635347366333, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 128.11737000000005, "r_x1": 141.4886, "r_y1": 128.11737000000005, "r_x2": 141.4886, "r_y2": 117.54894999999988, "r_x3": 134.765, "r_y3": 117.54894999999988, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9382, "r_y0": 128.11737000000005, "r_x1": 219.25478999999999, "r_y1": 128.11737000000005, "r_x2": 219.25478999999999, "r_y2": 117.54894999999988, "r_x3": 154.9382, "r_y3": 117.54894999999988, "coord_origin": "TOPLEFT" }, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6 Conclusion" }, { "label": "text", "id": 2, "page_no": 11, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.765, "t": 146.86377000000005, "r": 480.59569999999997, "b": 203.48181, "coord_origin": "TOPLEFT" }, "confidence": 0.9806171655654907, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 155.66076999999996, "r_x1": 480.59476, "r_y1": 155.66076999999996, "r_x2": 480.59476, "r_y2": 146.86377000000005, "r_x3": 134.765, "r_y3": 146.86377000000005, "coord_origin": "TOPLEFT" }, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 167.61577999999997, "r_x1": 480.59476, "r_y1": 167.61577999999997, "r_x2": 480.59476, "r_y2": 158.81879000000004, "r_x3": 134.765, "r_y3": 158.81879000000004, "coord_origin": "TOPLEFT" }, "text": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "orig": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 179.57079999999996, "r_x1": 480.58978, "r_y1": 179.57079999999996, "r_x2": 480.58978, "r_y2": 170.77380000000005, "r_x3": 134.765, "r_y3": 170.77380000000005, "coord_origin": "TOPLEFT" }, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 191.52679, "r_x1": 480.59569999999997, "r_y1": 191.52679, "r_x2": 480.59569999999997, "r_y2": 182.72979999999995, "r_x3": 134.765, "r_y3": 182.72979999999995, "coord_origin": "TOPLEFT" }, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 203.48181, "r_x1": 239.5387, "r_y1": 203.48181, "r_x2": 239.5387, "r_y2": 194.68480999999997, "r_x3": 134.765, "r_y3": 194.68480999999997, "coord_origin": "TOPLEFT" }, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We demonstrated that representing tables in HTML for the task of table structure recognition with Im2Seq models is ill-suited and has serious limitations. Furthermore, we presented in this paper an Optimized Table Structure Language (OTSL) which, when compared to commonly used general purpose languages, has several key benefits." }, { "label": "text", "id": 0, "page_no": 11, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.765, "t": 207.44379000000004, "r": 480.59479, "b": 323.83679, "coord_origin": "TOPLEFT" }, "confidence": 0.9873476028442383, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 216.24077999999997, "r_x1": 480.59283000000005, "r_y1": 216.24077999999997, "r_x2": 480.59283000000005, "r_y2": 207.44379000000004, "r_x3": 149.709, "r_y3": 207.44379000000004, "coord_origin": "TOPLEFT" }, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 228.19579999999996, "r_x1": 480.59365999999994, "r_y1": 228.19579999999996, "r_x2": 480.59365999999994, "r_y2": 219.39880000000005, "r_x3": 134.765, "r_y3": 219.39880000000005, "coord_origin": "TOPLEFT" }, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 240.15081999999995, "r_x1": 480.59079, "r_y1": 240.15081999999995, "r_x2": 480.59079, "r_y2": 231.35382000000004, "r_x3": 134.765, "r_y3": 231.35382000000004, "coord_origin": "TOPLEFT" }, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 252.10582999999997, "r_x1": 480.58786000000003, "r_y1": 252.10582999999997, "r_x2": 480.58786000000003, "r_y2": 243.30884000000003, "r_x3": 134.765, "r_y3": 243.30884000000003, "coord_origin": "TOPLEFT" }, "text": "OTSL representation. Additional performance benefits can be obtained with", "orig": "OTSL representation. Additional performance benefits can be obtained with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 264.06183, "r_x1": 480.59479, "r_y1": 264.06183, "r_x2": 480.59479, "r_y2": 255.26482999999996, "r_x3": 134.765, "r_y3": 255.26482999999996, "coord_origin": "TOPLEFT" }, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 276.01685, "r_x1": 480.5878000000001, "r_y1": 276.01685, "r_x2": 480.5878000000001, "r_y2": 267.21984999999995, "r_x3": 134.765, "r_y3": 267.21984999999995, "coord_origin": "TOPLEFT" }, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 287.97183, "r_x1": 480.59268, "r_y1": 287.97183, "r_x2": 480.59268, "r_y2": 279.17487000000006, "r_x3": 134.765, "r_y3": 279.17487000000006, "coord_origin": "TOPLEFT" }, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 299.92682, "r_x1": 480.58871, "r_y1": 299.92682, "r_x2": 480.58871, "r_y2": 291.12985, "r_x3": 134.765, "r_y3": 291.12985, "coord_origin": "TOPLEFT" }, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 311.88181, "r_x1": 480.59375, "r_y1": 311.88181, "r_x2": 480.59375, "r_y2": 303.08484, "r_x3": 134.765, "r_y3": 303.08484, "coord_origin": "TOPLEFT" }, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 323.83679, "r_x1": 240.92351000000002, "r_y1": 323.83679, "r_x2": 240.92351000000002, "r_y2": 315.03983, "r_x3": 134.765, "r_y3": 315.03983, "coord_origin": "TOPLEFT" }, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "First and foremost, given the same network configuration, inference time for a table-structure prediction is about 2 times faster compared to the conventional HTML approach. This is primarily owed to the shorter sequence length of the OTSL representation. Additional performance benefits can be obtained with HPO (hyper parameter optimization). As we demonstrate in our experiments, models trained on OTSL can be significantly smaller, e.g. by reducing the number of encoder and decoder layers, while preserving comparatively good prediction quality. This can further improve inference performance, yielding 5-6 times faster inference speed in OTSL with prediction quality comparable to models trained on HTML (see Table 1)." }, { "label": "text", "id": 1, "page_no": 11, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.765, "t": 327.79883, "r": 480.59482, "b": 468.10266, "coord_origin": "TOPLEFT" }, "confidence": 0.9868747591972351, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.709, "r_y0": 336.5957900000001, "r_x1": 480.58984, "r_y1": 336.5957900000001, "r_x2": 480.58984, "r_y2": 327.79883, "r_x3": 149.709, "r_y3": 327.79883, "coord_origin": "TOPLEFT" }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 348.55179, "r_x1": 480.59473, "r_y1": 348.55179, "r_x2": 480.59473, "r_y2": 339.75482, "r_x3": 134.765, "r_y3": 339.75482, "coord_origin": "TOPLEFT" }, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 360.50677, "r_x1": 480.58664, "r_y1": 360.50677, "r_x2": 480.58664, "r_y2": 351.70981, "r_x3": 134.765, "r_y3": 351.70981, "coord_origin": "TOPLEFT" }, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 372.46176, "r_x1": 480.59479, "r_y1": 372.46176, "r_x2": 480.59479, "r_y2": 363.66479, "r_x3": 134.765, "r_y3": 363.66479, "coord_origin": "TOPLEFT" }, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 384.41675, "r_x1": 480.58971999999994, "r_y1": 384.41675, "r_x2": 480.58971999999994, "r_y2": 375.61978, "r_x3": 134.765, "r_y3": 375.61978, "coord_origin": "TOPLEFT" }, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 396.37173, "r_x1": 480.58673, "r_y1": 396.37173, "r_x2": 480.58673, "r_y2": 387.57477, "r_x3": 134.765, "r_y3": 387.57477, "coord_origin": "TOPLEFT" }, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 408.32773, "r_x1": 480.58574999999996, "r_y1": 408.32773, "r_x2": 480.58574999999996, "r_y2": 399.53076, "r_x3": 134.765, "r_y3": 399.53076, "coord_origin": "TOPLEFT" }, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 420.28271, "r_x1": 480.58675999999997, "r_y1": 420.28271, "r_x2": 480.58675999999997, "r_y2": 411.48575, "r_x3": 134.765, "r_y3": 411.48575, "coord_origin": "TOPLEFT" }, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 432.23769999999996, "r_x1": 480.59482, "r_y1": 432.23769999999996, "r_x2": 480.59482, "r_y2": 423.44073, "r_x3": 134.765, "r_y3": 423.44073, "coord_origin": "TOPLEFT" }, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 444.19269, "r_x1": 480.58777, "r_y1": 444.19269, "r_x2": 480.58777, "r_y2": 435.39572, "r_x3": 134.765, "r_y3": 435.39572, "coord_origin": "TOPLEFT" }, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 456.14767, "r_x1": 480.58968999999996, "r_y1": 456.14767, "r_x2": 480.58968999999996, "r_y2": 447.35071, "r_x3": 134.765, "r_y3": 447.35071, "coord_origin": "TOPLEFT" }, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 468.10266, "r_x1": 366.77698, "r_y1": 468.10266, "r_x2": 366.77698, "r_y2": 459.30569, "r_x3": 134.765, "r_y3": 459.30569, "coord_origin": "TOPLEFT" }, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vocabulary size. This allows autoregressive models to perform better in the TED metric, but especially with regards to prediction accuracy of the table-cell bounding boxes (see Table 2). As shown in Figure 5, we observe that the OTSL drastically reduces the drift for table cell bounding boxes at high row count and in sparse tables. This leads to more accurate predictions and a significant reduction in post-processing complexity, which is an undesired necessity in HTML-based Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few, simple and always backwards looking. Each new token can be validated only by analyzing the sequence of previous tokens, without requiring the entire sequence to detect mistakes. This in return allows to perform structural error detection and correction on-the-fly during sequence generation." }, { "label": "section_header", "id": 7, "page_no": 11, "cluster": { "id": 7, "label": "section_header", "bbox": { "l": 134.765, "t": 493.82083, "r": 197.68642, "b": 504.38922, "coord_origin": "TOPLEFT" }, "confidence": 0.9403266310691833, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 504.38922, "r_x1": 197.68642, "r_y1": 504.38922, "r_x2": 197.68642, "r_y2": 493.82083, "r_x3": 134.765, "r_y3": 493.82083, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "References" }, { "label": "list_item", "id": 5, "page_no": 11, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.371, "t": 522.87985, "r": 480.5920100000001, "b": 563.87144, "coord_origin": "TOPLEFT" }, "confidence": 0.9698606729507446, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 530.94962, "r_x1": 146.46127, "r_y1": 530.94962, "r_x2": 146.46127, "r_y2": 522.87985, "r_x3": 139.371, "r_y3": 522.87985, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.01955, "r_y0": 530.94962, "r_x1": 480.5920100000001, "r_y1": 530.94962, "r_x2": 480.5920100000001, "r_y2": 522.87985, "r_x3": 151.01955, "r_y3": 522.87985, "coord_origin": "TOPLEFT" }, "text": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "orig": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 541.90862, "r_x1": 480.58667, "r_y1": 541.90862, "r_x2": 480.58667, "r_y2": 533.83887, "r_x3": 151.51801, "r_y3": 533.83887, "coord_origin": "TOPLEFT" }, "text": "ument conversion as a cloud service with high throughput and responsiveness.", "orig": "ument conversion as a cloud service with high throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 552.86761, "r_x1": 176.34149, "r_y1": 552.86761, "r_x2": 176.34149, "r_y2": 544.79785, "r_x3": 151.51801, "r_y3": 544.79785, "coord_origin": "TOPLEFT" }, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.464, "r_y0": 552.66139, "r_x1": 250.67963, "r_y1": 552.66139, "r_x2": 250.67963, "r_y2": 544.73509, "r_x3": 179.464, "r_y3": 544.73509, "coord_origin": "TOPLEFT" }, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.804, "r_y0": 552.86761, "r_x1": 281.9567, "r_y1": 552.86761, "r_x2": 281.9567, "r_y2": 544.79785, "r_x3": 253.804, "r_y3": 544.79785, "coord_origin": "TOPLEFT" }, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.078, "r_y0": 552.91245, "r_x1": 478.03403000000003, "r_y1": 552.91245, "r_x2": 478.03403000000003, "r_y2": 545.44344, "r_x3": 285.078, "r_y3": 545.44344, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0319799999999, "r_y0": 552.86761, "r_x1": 480.59099999999995, "r_y1": 552.86761, "r_x2": 480.59099999999995, "r_y2": 544.79785, "r_x3": 478.0319799999999, "r_y3": 544.79785, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 563.87144, "r_x1": 344.474, "r_y1": 563.87144, "r_x2": 344.474, "r_y2": 556.4024400000001, "r_x3": 151.51797, "r_y3": 556.4024400000001, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering document conversion as a cloud service with high throughput and responsiveness. CoRR abs/2206.00785 (2022). https://doi.org/10.48550/arXiv.2206.00785 , https://doi.org/10.48550/arXiv.2206.00785" }, { "label": "list_item", "id": 4, "page_no": 11, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.37097, "t": 567.51884, "r": 480.5920100000001, "b": 608.46561, "coord_origin": "TOPLEFT" }, "confidence": 0.9730570316314697, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37097, "r_y0": 575.58861, "r_x1": 145.94186, "r_y1": 575.58861, "r_x2": 145.94186, "r_y2": 567.51884, "r_x3": 139.37097, "r_y3": 567.51884, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.16624, "r_y0": 575.58861, "r_x1": 480.58636, "r_y1": 575.58861, "r_x2": 480.58636, "r_y2": 567.51884, "r_x3": 150.16624, "r_y3": 567.51884, "coord_origin": "TOPLEFT" }, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 586.5476100000001, "r_x1": 480.59012, "r_y1": 586.5476100000001, "r_x2": 480.59012, "r_y2": 578.47784, "r_x3": 151.51797, "r_y3": 578.47784, "coord_origin": "TOPLEFT" }, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 597.50661, "r_x1": 480.5920100000001, "r_y1": 597.50661, "r_x2": 480.5920100000001, "r_y2": 589.43684, "r_x3": 151.51797, "r_y3": 589.43684, "coord_origin": "TOPLEFT" }, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 608.46561, "r_x1": 364.17856, "r_y1": 608.46561, "r_x2": 364.17856, "r_y2": 600.39584, "r_x3": 151.51797, "r_y3": 600.39584, "coord_origin": "TOPLEFT" }, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition in the wild using transformer and identity matrix-based augmentation. In: Porwal, U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545561. Springer International Publishing, Cham (2022)" }, { "label": "list_item", "id": 6, "page_no": 11, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 139.37097, "t": 612.1588399999999, "r": 480.58731000000006, "b": 631.18761, "coord_origin": "TOPLEFT" }, "confidence": 0.9617196321487427, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37097, "r_y0": 620.22861, "r_x1": 146.4379, "r_y1": 620.22861, "r_x2": 146.4379, "r_y2": 612.1588399999999, "r_x3": 139.37097, "r_y3": 612.1588399999999, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.98117, "r_y0": 620.22861, "r_x1": 480.58731000000006, "r_y1": 620.22861, "r_x2": 480.58731000000006, "r_y2": 612.1588399999999, "r_x3": 150.98117, "r_y3": 612.1588399999999, "coord_origin": "TOPLEFT" }, "text": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 631.18761, "r_x1": 400.22525, "r_y1": 631.18761, "r_x2": 400.22525, "r_y2": 623.11784, "r_x3": 151.51797, "r_y3": 623.11784, "coord_origin": "TOPLEFT" }, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table structure recognition. arXiv preprint arXiv:1908.04729 (2019)" }, { "label": "list_item", "id": 3, "page_no": 11, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 139.37097, "t": 634.88084, "r": 480.58826, "b": 664.86761, "coord_origin": "TOPLEFT" }, "confidence": 0.9754673838615417, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37097, "r_y0": 642.95061, "r_x1": 146.52443, "r_y1": 642.95061, "r_x2": 146.52443, "r_y2": 634.88084, "r_x3": 139.37097, "r_y3": 634.88084, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.12335, "r_y0": 642.95061, "r_x1": 480.58826, "r_y1": 642.95061, "r_x2": 480.58826, "r_y2": 634.88084, "r_x3": 151.12335, "r_y3": 634.88084, "coord_origin": "TOPLEFT" }, "text": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "orig": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 653.9096099999999, "r_x1": 480.58752, "r_y1": 653.9096099999999, "r_x2": 480.58752, "r_y2": 645.83984, "r_x3": 151.51797, "r_y3": 645.83984, "coord_origin": "TOPLEFT" }, "text": "table recognition. In: 2019 International Conference on Document Analysis and", "orig": "table recognition. In: 2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 664.86761, "r_x1": 350.11115, "r_y1": 664.86761, "r_x2": 350.11115, "r_y2": 656.79785, "r_x3": 151.51797, "r_y3": 656.79785, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific table recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 894-901. IEEE (2019)" } ], "headers": [ { "label": "page_header", "id": 10, "page_no": 11, "cluster": { "id": 10, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 143.97887, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8610832691192627, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 143.97887, "r_y1": 101.84069999999997, "r_x2": 143.97887, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12" }, { "label": "page_header", "id": 9, "page_no": 11, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 167.82053, "t": 93.77099999999996, "r": 231.72049000000004, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.8927664756774902, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82053, "r_y0": 101.84069999999997, "r_x1": 178.08249, "r_y1": 101.84069999999997, "r_x2": 178.08249, "r_y2": 93.77099999999996, "r_x3": 167.82053, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37929, "r_y0": 101.84069999999997, "r_x1": 231.72049000000004, "r_y1": 101.84069999999997, "r_x2": 231.72049000000004, "r_y2": 93.77099999999996, "r_x3": 182.37929, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 12, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.37561, "r_y0": 101.84069999999997, "r_x1": 480.5894799999999, "r_y1": 101.84069999999997, "r_x2": 480.5894799999999, "r_y2": 93.77099999999996, "r_x3": 471.37561, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 127.74370999999985, "r_x1": 146.04857, "r_y1": 127.74370999999985, "r_x2": 146.04857, "r_y2": 119.67400999999995, "r_x3": 139.371, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.34157, "r_y0": 127.74370999999985, "r_x1": 480.58826, "r_y1": 127.74370999999985, "r_x2": 480.58826, "r_y2": 119.67400999999995, "r_x3": 150.34157, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 138.70270000000005, "r_x1": 480.59479, "r_y1": 138.70270000000005, "r_x2": 480.59479, "r_y2": 130.63300000000004, "r_x3": 151.51801, "r_y3": 130.63300000000004, "coord_origin": "TOPLEFT" }, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 149.66168000000005, "r_x1": 304.04364, "r_y1": 149.66168000000005, "r_x2": 304.04364, "r_y2": 141.59198000000004, "r_x3": 151.51801, "r_y3": 141.59198000000004, "coord_origin": "TOPLEFT" }, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 160.63165000000004, "r_x1": 145.93991, "r_y1": 160.63165000000004, "r_x2": 145.93991, "r_y2": 152.56195000000002, "r_x3": 139.371, "r_y3": 152.56195000000002, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.16298, "r_y0": 160.63165000000004, "r_x1": 480.59015, "r_y1": 160.63165000000004, "r_x2": 480.59015, "r_y2": 152.56195000000002, "r_x3": 150.16298, "r_y3": 152.56195000000002, "coord_origin": "TOPLEFT" }, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 171.59064, "r_x1": 480.5903, "r_y1": 171.59064, "r_x2": 480.5903, "r_y2": 163.52094, "r_x3": 151.51801, "r_y3": 163.52094, "coord_origin": "TOPLEFT" }, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 182.54962, "r_x1": 480.59286000000003, "r_y1": 182.54962, "r_x2": 480.59286000000003, "r_y2": 174.47992, "r_x3": 151.51801, "r_y3": 174.47992, "coord_origin": "TOPLEFT" }, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 193.50860999999998, "r_x1": 226.37399, "r_y1": 193.50860999999998, "r_x2": 226.37399, "r_y2": 185.4389, "r_x3": 151.51801, "r_y3": 185.4389, "coord_origin": "TOPLEFT" }, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 204.47857999999997, "r_x1": 146.31418, "r_y1": 204.47857999999997, "r_x2": 146.31418, "r_y2": 196.40886999999998, "r_x3": 139.371, "r_y3": 196.40886999999998, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.77789, "r_y0": 204.47857999999997, "r_x1": 480.59012, "r_y1": 204.47857999999997, "r_x2": 480.59012, "r_y2": 196.40886999999998, "r_x3": 150.77789, "r_y3": 196.40886999999998, "coord_origin": "TOPLEFT" }, "text": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 215.43755999999996, "r_x1": 352.01746, "r_y1": 215.43755999999996, "r_x2": 352.01746, "r_y2": 207.36785999999995, "r_x3": 151.51801, "r_y3": 207.36785999999995, "coord_origin": "TOPLEFT" }, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 226.40857000000005, "r_x1": 146.37106, "r_y1": 226.40857000000005, "r_x2": 146.37106, "r_y2": 218.33887000000004, "r_x3": 139.371, "r_y3": 218.33887000000004, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.87132, "r_y0": 226.40857000000005, "r_x1": 480.58731000000006, "r_y1": 226.40857000000005, "r_x2": 480.58731000000006, "r_y2": 218.33887000000004, "r_x3": 150.87132, "r_y3": 218.33887000000004, "coord_origin": "TOPLEFT" }, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 237.36755000000005, "r_x1": 480.59020999999996, "r_y1": 237.36755000000005, "r_x2": 480.59020999999996, "r_y2": 229.29785000000004, "r_x3": 151.51801, "r_y3": 229.29785000000004, "coord_origin": "TOPLEFT" }, "text": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 248.32654000000002, "r_x1": 480.59473, "r_y1": 248.32654000000002, "r_x2": 480.59473, "r_y2": 240.25684, "r_x3": 151.51801, "r_y3": 240.25684, "coord_origin": "TOPLEFT" }, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 259.28552, "r_x1": 197.08617, "r_y1": 259.28552, "r_x2": 197.08617, "r_y2": 251.21582, "r_x3": 151.51801, "r_y3": 251.21582, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.40001, "r_y0": 259.07935, "r_x1": 210.00726, "r_y1": 259.07935, "r_x2": 210.00726, "r_y2": 251.15301999999997, "r_x3": 199.40001, "r_y3": 251.15301999999997, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.007, "r_y0": 259.28552, "r_x1": 332.37683, "r_y1": 259.28552, "r_x2": 332.37683, "r_y2": 251.21582, "r_x3": 210.007, "r_y3": 251.21582, "coord_origin": "TOPLEFT" }, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.69901, "r_y0": 259.33038, "r_x1": 480.59039000000007, "r_y1": 259.33038, "r_x2": 480.59039000000007, "r_y2": 251.86139000000003, "r_x3": 334.69901, "r_y3": 251.86139000000003, "coord_origin": "TOPLEFT" }, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 270.28839000000005, "r_x1": 259.75769, "r_y1": 270.28839000000005, "r_x2": 259.75769, "r_y2": 262.8194, "r_x3": 151.51801, "r_y3": 262.8194, "coord_origin": "TOPLEFT" }, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 281.21457, "r_x1": 146.14218, "r_y1": 281.21457, "r_x2": 146.14218, "r_y2": 273.14484000000004, "r_x3": 139.371, "r_y3": 273.14484000000004, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.49533, "r_y0": 281.21457, "r_x1": 480.5881999999999, "r_y1": 281.21457, "r_x2": 480.5881999999999, "r_y2": 273.14484000000004, "r_x3": 150.49533, "r_y3": 273.14484000000004, "coord_origin": "TOPLEFT" }, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 292.17355, "r_x1": 480.59387000000004, "r_y1": 292.17355, "r_x2": 480.59387000000004, "r_y2": 284.10379, "r_x3": 151.51801, "r_y3": 284.10379, "coord_origin": "TOPLEFT" }, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 303.13254, "r_x1": 473.44308000000007, "r_y1": 303.13254, "r_x2": 473.44308000000007, "r_y2": 295.06277, "r_x3": 151.51801, "r_y3": 295.06277, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 314.10254000000003, "r_x1": 146.49922, "r_y1": 314.10254000000003, "r_x2": 146.49922, "r_y2": 306.03277999999995, "r_x3": 134.76401, "r_y3": 306.03277999999995, "coord_origin": "TOPLEFT" }, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.09138, "r_y0": 314.10254000000003, "r_x1": 480.58905, "r_y1": 314.10254000000003, "r_x2": 480.58905, "r_y2": 306.03277999999995, "r_x3": 151.09138, "r_y3": 306.03277999999995, "coord_origin": "TOPLEFT" }, "text": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "orig": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 325.06155, "r_x1": 480.59015, "r_y1": 325.06155, "r_x2": 480.59015, "r_y2": 316.99179, "r_x3": 151.51801, "r_y3": 316.99179, "coord_origin": "TOPLEFT" }, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 336.02054, "r_x1": 480.59113, "r_y1": 336.02054, "r_x2": 480.59113, "r_y2": 327.95078, "r_x3": 151.51801, "r_y3": 327.95078, "coord_origin": "TOPLEFT" }, "text": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 346.97952, "r_x1": 480.59113, "r_y1": 346.97952, "r_x2": 480.59113, "r_y2": 338.90976, "r_x3": 151.51801, "r_y3": 338.90976, "coord_origin": "TOPLEFT" }, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 357.93851, "r_x1": 251.14098999999996, "r_y1": 357.93851, "r_x2": 251.14098999999996, "r_y2": 349.86874, "r_x3": 151.51801, "r_y3": 349.86874, "coord_origin": "TOPLEFT" }, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.99001, "r_y0": 357.98333999999994, "r_x1": 437.53311, "r_y1": 357.98333999999994, "r_x2": 437.53311, "r_y2": 350.5143100000001, "r_x3": 253.99001, "r_y3": 350.5143100000001, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.53201, "r_y0": 357.93851, "r_x1": 440.09102999999993, "r_y1": 357.93851, "r_x2": 440.09102999999993, "r_y2": 349.86874, "r_x3": 437.53201, "r_y3": 349.86874, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94202000000007, "r_y0": 357.98333999999994, "r_x1": 480.59372, "r_y1": 357.98333999999994, "r_x2": 480.59372, "r_y2": 350.5143100000001, "r_x3": 442.94202000000007, "r_y3": 350.5143100000001, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 368.94232, "r_x1": 297.40939, "r_y1": 368.94232, "r_x2": 297.40939, "r_y2": 361.47329999999994, "r_x3": 151.51801, "r_y3": 361.47329999999994, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 379.86749, "r_x1": 146.03854, "r_y1": 379.86749, "r_x2": 146.03854, "r_y2": 371.79773, "r_x3": 134.76401, "r_y3": 371.79773, "coord_origin": "TOPLEFT" }, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.4505, "r_y0": 379.86749, "r_x1": 480.58914000000004, "r_y1": 379.86749, "r_x2": 480.58914000000004, "r_y2": 371.79773, "r_x3": 150.4505, "r_y3": 371.79773, "coord_origin": "TOPLEFT" }, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 390.82651, "r_x1": 480.59296, "r_y1": 390.82651, "r_x2": 480.59296, "r_y2": 382.7567399999999, "r_x3": 151.51801, "r_y3": 382.7567399999999, "coord_origin": "TOPLEFT" }, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 401.78549, "r_x1": 480.59293, "r_y1": 401.78549, "r_x2": 480.59293, "r_y2": 393.71573, "r_x3": 151.51801, "r_y3": 393.71573, "coord_origin": "TOPLEFT" }, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 412.74448, "r_x1": 373.82727, "r_y1": 412.74448, "r_x2": 373.82727, "r_y2": 404.67471, "r_x3": 151.51801, "r_y3": 404.67471, "coord_origin": "TOPLEFT" }, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 423.71448000000004, "r_x1": 145.91106, "r_y1": 423.71448000000004, "r_x2": 145.91106, "r_y2": 415.64471, "r_x3": 134.76401, "r_y3": 415.64471, "coord_origin": "TOPLEFT" }, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.27309, "r_y0": 423.71448000000004, "r_x1": 480.5874, "r_y1": 423.71448000000004, "r_x2": 480.5874, "r_y2": 415.64471, "r_x3": 150.27309, "r_y3": 415.64471, "coord_origin": "TOPLEFT" }, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 434.67349, "r_x1": 480.59469999999993, "r_y1": 434.67349, "r_x2": 480.59469999999993, "r_y2": 426.60373, "r_x3": 151.51801, "r_y3": 426.60373, "coord_origin": "TOPLEFT" }, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 445.63248, "r_x1": 480.58844, "r_y1": 445.63248, "r_x2": 480.58844, "r_y2": 437.5627099999999, "r_x3": 151.51801, "r_y3": 437.5627099999999, "coord_origin": "TOPLEFT" }, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 456.59146, "r_x1": 292.91455, "r_y1": 456.59146, "r_x2": 292.91455, "r_y2": 448.5217, "r_x3": 151.51801, "r_y3": 448.5217, "coord_origin": "TOPLEFT" }, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 467.56146, "r_x1": 145.7785, "r_y1": 467.56146, "r_x2": 145.7785, "r_y2": 459.4917, "r_x3": 134.76401, "r_y3": 459.4917, "coord_origin": "TOPLEFT" }, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.08871, "r_y0": 467.56146, "r_x1": 480.59006, "r_y1": 467.56146, "r_x2": 480.59006, "r_y2": 459.4917, "r_x3": 150.08871, "r_y3": 459.4917, "coord_origin": "TOPLEFT" }, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 478.52048, "r_x1": 480.59116, "r_y1": 478.52048, "r_x2": 480.59116, "r_y2": 470.45071, "r_x3": 151.51801, "r_y3": 470.45071, "coord_origin": "TOPLEFT" }, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 489.47946, "r_x1": 439.05963, "r_y1": 489.47946, "r_x2": 439.05963, "r_y2": 481.4097, "r_x3": 151.51801, "r_y3": 481.4097, "coord_origin": "TOPLEFT" }, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94202000000007, "r_y0": 489.52429, "r_x1": 480.59372, "r_y1": 489.52429, "r_x2": 480.59372, "r_y2": 482.05527, "r_x3": 442.94202000000007, "r_y3": 482.05527, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 500.48328, "r_x1": 302.11584, "r_y1": 500.48328, "r_x2": 302.11584, "r_y2": 493.01425, "r_x3": 151.51801, "r_y3": 493.01425, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 511.40845, "r_x1": 146.15501, "r_y1": 511.40845, "r_x2": 146.15501, "r_y2": 503.33868, "r_x3": 134.76401, "r_y3": 503.33868, "coord_origin": "TOPLEFT" }, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.61252, "r_y0": 511.40845, "r_x1": 480.59088, "r_y1": 511.40845, "r_x2": 480.59088, "r_y2": 503.33868, "r_x3": 150.61252, "r_y3": 503.33868, "coord_origin": "TOPLEFT" }, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 522.3674599999999, "r_x1": 480.59286000000003, "r_y1": 522.3674599999999, "r_x2": 480.59286000000003, "r_y2": 514.2977000000001, "r_x3": 151.51801, "r_y3": 514.2977000000001, "coord_origin": "TOPLEFT" }, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 533.32645, "r_x1": 480.58838000000003, "r_y1": 533.32645, "r_x2": 480.58838000000003, "r_y2": 525.25668, "r_x3": 151.51801, "r_y3": 525.25668, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 544.28545, "r_x1": 199.24704, "r_y1": 544.28545, "r_x2": 199.24704, "r_y2": 536.21568, "r_x3": 151.51801, "r_y3": 536.21568, "coord_origin": "TOPLEFT" }, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 555.25545, "r_x1": 146.16588, "r_y1": 555.25545, "r_x2": 146.16588, "r_y2": 547.18568, "r_x3": 134.76401, "r_y3": 547.18568, "coord_origin": "TOPLEFT" }, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.62764, "r_y0": 555.25545, "r_x1": 480.58734000000004, "r_y1": 555.25545, "r_x2": 480.58734000000004, "r_y2": 547.18568, "r_x3": 150.62764, "r_y3": 547.18568, "coord_origin": "TOPLEFT" }, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 566.2144499999999, "r_x1": 480.58838000000003, "r_y1": 566.2144499999999, "r_x2": 480.58838000000003, "r_y2": 558.14468, "r_x3": 151.51801, "r_y3": 558.14468, "coord_origin": "TOPLEFT" }, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 577.17345, "r_x1": 480.59109, "r_y1": 577.17345, "r_x2": 480.59109, "r_y2": 569.1036799999999, "r_x3": 151.51801, "r_y3": 569.1036799999999, "coord_origin": "TOPLEFT" }, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 588.1324500000001, "r_x1": 480.59195, "r_y1": 588.1324500000001, "r_x2": 480.59195, "r_y2": 580.06268, "r_x3": 151.51801, "r_y3": 580.06268, "coord_origin": "TOPLEFT" }, "text": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 599.09145, "r_x1": 200.75787, "r_y1": 599.09145, "r_x2": 200.75787, "r_y2": 591.0216800000001, "r_x3": 151.51801, "r_y3": 591.0216800000001, "coord_origin": "TOPLEFT" }, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 202.916, "r_y0": 599.1362799999999, "r_x1": 386.45911, "r_y1": 599.1362799999999, "r_x2": 386.45911, "r_y2": 591.66727, "r_x3": 202.916, "r_y3": 591.66727, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.45801, "r_y0": 599.09145, "r_x1": 389.01703, "r_y1": 599.09145, "r_x2": 389.01703, "r_y2": 591.0216800000001, "r_x3": 386.45801, "r_y3": 591.0216800000001, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.173, "r_y0": 599.1362799999999, "r_x1": 480.59583, "r_y1": 599.1362799999999, "r_x2": 480.59583, "r_y2": 591.66727, "r_x3": 391.173, "r_y3": 591.66727, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 610.09528, "r_x1": 245.63831, "r_y1": 610.09528, "r_x2": 245.63831, "r_y2": 602.62627, "r_x3": 151.51801, "r_y3": 602.62627, "coord_origin": "TOPLEFT" }, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 621.02045, "r_x1": 146.62019, "r_y1": 621.02045, "r_x2": 146.62019, "r_y2": 612.95068, "r_x3": 134.76401, "r_y3": 612.95068, "coord_origin": "TOPLEFT" }, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.25977, "r_y0": 621.02045, "r_x1": 480.59542999999996, "r_y1": 621.02045, "r_x2": 480.59542999999996, "r_y2": 612.95068, "r_x3": 151.25977, "r_y3": 612.95068, "coord_origin": "TOPLEFT" }, "text": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "orig": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 631.97945, "r_x1": 234.43031, "r_y1": 631.97945, "r_x2": 234.43031, "r_y2": 623.90968, "r_x3": 151.51801, "r_y3": 623.90968, "coord_origin": "TOPLEFT" }, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 642.9494500000001, "r_x1": 146.30539, "r_y1": 642.9494500000001, "r_x2": 146.30539, "r_y2": 634.87968, "r_x3": 134.76401, "r_y3": 634.87968, "coord_origin": "TOPLEFT" }, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.82175, "r_y0": 642.9494500000001, "r_x1": 480.58731000000006, "r_y1": 642.9494500000001, "r_x2": 480.58731000000006, "r_y2": 634.87968, "r_x3": 150.82175, "r_y3": 634.87968, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 653.90845, "r_x1": 480.59119, "r_y1": 653.90845, "r_x2": 480.59119, "r_y2": 645.8386800000001, "r_x3": 151.51801, "r_y3": 645.8386800000001, "coord_origin": "TOPLEFT" }, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 664.86745, "r_x1": 299.30307, "r_y1": 664.86745, "r_x2": 299.30307, "r_y2": 656.79768, "r_x3": 151.51801, "r_y3": 656.79768, "coord_origin": "TOPLEFT" }, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 13, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9163166880607605, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "page_header", "bbox": { "l": 471.37561, "t": 93.77099999999996, "r": 480.5894799999999, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9061064720153809, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.37561, "r_y0": 101.84069999999997, "r_x1": 480.5894799999999, "r_y1": 101.84069999999997, "r_x2": 480.5894799999999, "r_y2": 93.77099999999996, "r_x3": 471.37561, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 139.371, "t": 119.67400999999995, "r": 480.59479, "b": 149.66168000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9677112698554993, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 127.74370999999985, "r_x1": 146.04857, "r_y1": 127.74370999999985, "r_x2": 146.04857, "r_y2": 119.67400999999995, "r_x3": 139.371, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.34157, "r_y0": 127.74370999999985, "r_x1": 480.58826, "r_y1": 127.74370999999985, "r_x2": 480.58826, "r_y2": 119.67400999999995, "r_x3": 150.34157, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 138.70270000000005, "r_x1": 480.59479, "r_y1": 138.70270000000005, "r_x2": 480.59479, "r_y2": 130.63300000000004, "r_x3": 151.51801, "r_y3": 130.63300000000004, "coord_origin": "TOPLEFT" }, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 149.66168000000005, "r_x1": 304.04364, "r_y1": 149.66168000000005, "r_x2": 304.04364, "r_y2": 141.59198000000004, "r_x3": 151.51801, "r_y3": 141.59198000000004, "coord_origin": "TOPLEFT" }, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "list_item", "bbox": { "l": 139.371, "t": 152.56195000000002, "r": 480.59286000000003, "b": 193.50860999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.973045289516449, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 160.63165000000004, "r_x1": 145.93991, "r_y1": 160.63165000000004, "r_x2": 145.93991, "r_y2": 152.56195000000002, "r_x3": 139.371, "r_y3": 152.56195000000002, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.16298, "r_y0": 160.63165000000004, "r_x1": 480.59015, "r_y1": 160.63165000000004, "r_x2": 480.59015, "r_y2": 152.56195000000002, "r_x3": 150.16298, "r_y3": 152.56195000000002, "coord_origin": "TOPLEFT" }, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 171.59064, "r_x1": 480.5903, "r_y1": 171.59064, "r_x2": 480.5903, "r_y2": 163.52094, "r_x3": 151.51801, "r_y3": 163.52094, "coord_origin": "TOPLEFT" }, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 182.54962, "r_x1": 480.59286000000003, "r_y1": 182.54962, "r_x2": 480.59286000000003, "r_y2": 174.47992, "r_x3": 151.51801, "r_y3": 174.47992, "coord_origin": "TOPLEFT" }, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 193.50860999999998, "r_x1": 226.37399, "r_y1": 193.50860999999998, "r_x2": 226.37399, "r_y2": 185.4389, "r_x3": 151.51801, "r_y3": 185.4389, "coord_origin": "TOPLEFT" }, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 139.371, "t": 196.40886999999998, "r": 480.59012, "b": 215.43755999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.9582491517066956, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 204.47857999999997, "r_x1": 146.31418, "r_y1": 204.47857999999997, "r_x2": 146.31418, "r_y2": 196.40886999999998, "r_x3": 139.371, "r_y3": 196.40886999999998, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.77789, "r_y0": 204.47857999999997, "r_x1": 480.59012, "r_y1": 204.47857999999997, "r_x2": 480.59012, "r_y2": 196.40886999999998, "r_x3": 150.77789, "r_y3": 196.40886999999998, "coord_origin": "TOPLEFT" }, "text": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 215.43755999999996, "r_x1": 352.01746, "r_y1": 215.43755999999996, "r_x2": 352.01746, "r_y2": 207.36785999999995, "r_x3": 151.51801, "r_y3": 207.36785999999995, "coord_origin": "TOPLEFT" }, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 139.371, "t": 218.33887000000004, "r": 480.59473, "b": 270.28839000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.967814564704895, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 226.40857000000005, "r_x1": 146.37106, "r_y1": 226.40857000000005, "r_x2": 146.37106, "r_y2": 218.33887000000004, "r_x3": 139.371, "r_y3": 218.33887000000004, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.87132, "r_y0": 226.40857000000005, "r_x1": 480.58731000000006, "r_y1": 226.40857000000005, "r_x2": 480.58731000000006, "r_y2": 218.33887000000004, "r_x3": 150.87132, "r_y3": 218.33887000000004, "coord_origin": "TOPLEFT" }, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 237.36755000000005, "r_x1": 480.59020999999996, "r_y1": 237.36755000000005, "r_x2": 480.59020999999996, "r_y2": 229.29785000000004, "r_x3": 151.51801, "r_y3": 229.29785000000004, "coord_origin": "TOPLEFT" }, "text": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 248.32654000000002, "r_x1": 480.59473, "r_y1": 248.32654000000002, "r_x2": 480.59473, "r_y2": 240.25684, "r_x3": 151.51801, "r_y3": 240.25684, "coord_origin": "TOPLEFT" }, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 259.28552, "r_x1": 197.08617, "r_y1": 259.28552, "r_x2": 197.08617, "r_y2": 251.21582, "r_x3": 151.51801, "r_y3": 251.21582, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.40001, "r_y0": 259.07935, "r_x1": 210.00726, "r_y1": 259.07935, "r_x2": 210.00726, "r_y2": 251.15301999999997, "r_x3": 199.40001, "r_y3": 251.15301999999997, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.007, "r_y0": 259.28552, "r_x1": 332.37683, "r_y1": 259.28552, "r_x2": 332.37683, "r_y2": 251.21582, "r_x3": 210.007, "r_y3": 251.21582, "coord_origin": "TOPLEFT" }, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.69901, "r_y0": 259.33038, "r_x1": 480.59039000000007, "r_y1": 259.33038, "r_x2": 480.59039000000007, "r_y2": 251.86139000000003, "r_x3": 334.69901, "r_y3": 251.86139000000003, "coord_origin": "TOPLEFT" }, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 270.28839000000005, "r_x1": 259.75769, "r_y1": 270.28839000000005, "r_x2": 259.75769, "r_y2": 262.8194, "r_x3": 151.51801, "r_y3": 262.8194, "coord_origin": "TOPLEFT" }, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "list_item", "bbox": { "l": 139.371, "t": 273.14484000000004, "r": 480.59387000000004, "b": 303.13254, "coord_origin": "TOPLEFT" }, "confidence": 0.9557179808616638, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 281.21457, "r_x1": 146.14218, "r_y1": 281.21457, "r_x2": 146.14218, "r_y2": 273.14484000000004, "r_x3": 139.371, "r_y3": 273.14484000000004, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.49533, "r_y0": 281.21457, "r_x1": 480.5881999999999, "r_y1": 281.21457, "r_x2": 480.5881999999999, "r_y2": 273.14484000000004, "r_x3": 150.49533, "r_y3": 273.14484000000004, "coord_origin": "TOPLEFT" }, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 292.17355, "r_x1": 480.59387000000004, "r_y1": 292.17355, "r_x2": 480.59387000000004, "r_y2": 284.10379, "r_x3": 151.51801, "r_y3": 284.10379, "coord_origin": "TOPLEFT" }, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 303.13254, "r_x1": 473.44308000000007, "r_y1": 303.13254, "r_x2": 473.44308000000007, "r_y2": 295.06277, "r_x3": 151.51801, "r_y3": 295.06277, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 134.76401, "t": 306.03277999999995, "r": 480.59372, "b": 368.94232, "coord_origin": "TOPLEFT" }, "confidence": 0.9639304876327515, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 314.10254000000003, "r_x1": 146.49922, "r_y1": 314.10254000000003, "r_x2": 146.49922, "r_y2": 306.03277999999995, "r_x3": 134.76401, "r_y3": 306.03277999999995, "coord_origin": "TOPLEFT" }, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.09138, "r_y0": 314.10254000000003, "r_x1": 480.58905, "r_y1": 314.10254000000003, "r_x2": 480.58905, "r_y2": 306.03277999999995, "r_x3": 151.09138, "r_y3": 306.03277999999995, "coord_origin": "TOPLEFT" }, "text": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "orig": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 325.06155, "r_x1": 480.59015, "r_y1": 325.06155, "r_x2": 480.59015, "r_y2": 316.99179, "r_x3": 151.51801, "r_y3": 316.99179, "coord_origin": "TOPLEFT" }, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 336.02054, "r_x1": 480.59113, "r_y1": 336.02054, "r_x2": 480.59113, "r_y2": 327.95078, "r_x3": 151.51801, "r_y3": 327.95078, "coord_origin": "TOPLEFT" }, "text": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 346.97952, "r_x1": 480.59113, "r_y1": 346.97952, "r_x2": 480.59113, "r_y2": 338.90976, "r_x3": 151.51801, "r_y3": 338.90976, "coord_origin": "TOPLEFT" }, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 357.93851, "r_x1": 251.14098999999996, "r_y1": 357.93851, "r_x2": 251.14098999999996, "r_y2": 349.86874, "r_x3": 151.51801, "r_y3": 349.86874, "coord_origin": "TOPLEFT" }, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.99001, "r_y0": 357.98333999999994, "r_x1": 437.53311, "r_y1": 357.98333999999994, "r_x2": 437.53311, "r_y2": 350.5143100000001, "r_x3": 253.99001, "r_y3": 350.5143100000001, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.53201, "r_y0": 357.93851, "r_x1": 440.09102999999993, "r_y1": 357.93851, "r_x2": 440.09102999999993, "r_y2": 349.86874, "r_x3": 437.53201, "r_y3": 349.86874, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94202000000007, "r_y0": 357.98333999999994, "r_x1": 480.59372, "r_y1": 357.98333999999994, "r_x2": 480.59372, "r_y2": 350.5143100000001, "r_x3": 442.94202000000007, "r_y3": 350.5143100000001, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 368.94232, "r_x1": 297.40939, "r_y1": 368.94232, "r_x2": 297.40939, "r_y2": 361.47329999999994, "r_x3": 151.51801, "r_y3": 361.47329999999994, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "list_item", "bbox": { "l": 134.76401, "t": 371.79773, "r": 480.59296, "b": 412.74448, "coord_origin": "TOPLEFT" }, "confidence": 0.9752162098884583, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 379.86749, "r_x1": 146.03854, "r_y1": 379.86749, "r_x2": 146.03854, "r_y2": 371.79773, "r_x3": 134.76401, "r_y3": 371.79773, "coord_origin": "TOPLEFT" }, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.4505, "r_y0": 379.86749, "r_x1": 480.58914000000004, "r_y1": 379.86749, "r_x2": 480.58914000000004, "r_y2": 371.79773, "r_x3": 150.4505, "r_y3": 371.79773, "coord_origin": "TOPLEFT" }, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 390.82651, "r_x1": 480.59296, "r_y1": 390.82651, "r_x2": 480.59296, "r_y2": 382.7567399999999, "r_x3": 151.51801, "r_y3": 382.7567399999999, "coord_origin": "TOPLEFT" }, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 401.78549, "r_x1": 480.59293, "r_y1": 401.78549, "r_x2": 480.59293, "r_y2": 393.71573, "r_x3": 151.51801, "r_y3": 393.71573, "coord_origin": "TOPLEFT" }, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 412.74448, "r_x1": 373.82727, "r_y1": 412.74448, "r_x2": 373.82727, "r_y2": 404.67471, "r_x3": 151.51801, "r_y3": 404.67471, "coord_origin": "TOPLEFT" }, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 134.76401, "t": 415.64471, "r": 480.59469999999993, "b": 456.59146, "coord_origin": "TOPLEFT" }, "confidence": 0.9707236886024475, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 423.71448000000004, "r_x1": 145.91106, "r_y1": 423.71448000000004, "r_x2": 145.91106, "r_y2": 415.64471, "r_x3": 134.76401, "r_y3": 415.64471, "coord_origin": "TOPLEFT" }, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.27309, "r_y0": 423.71448000000004, "r_x1": 480.5874, "r_y1": 423.71448000000004, "r_x2": 480.5874, "r_y2": 415.64471, "r_x3": 150.27309, "r_y3": 415.64471, "coord_origin": "TOPLEFT" }, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 434.67349, "r_x1": 480.59469999999993, "r_y1": 434.67349, "r_x2": 480.59469999999993, "r_y2": 426.60373, "r_x3": 151.51801, "r_y3": 426.60373, "coord_origin": "TOPLEFT" }, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 445.63248, "r_x1": 480.58844, "r_y1": 445.63248, "r_x2": 480.58844, "r_y2": 437.5627099999999, "r_x3": 151.51801, "r_y3": 437.5627099999999, "coord_origin": "TOPLEFT" }, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 456.59146, "r_x1": 292.91455, "r_y1": 456.59146, "r_x2": 292.91455, "r_y2": 448.5217, "r_x3": 151.51801, "r_y3": 448.5217, "coord_origin": "TOPLEFT" }, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "list_item", "bbox": { "l": 134.76401, "t": 459.4917, "r": 480.59372, "b": 500.48328, "coord_origin": "TOPLEFT" }, "confidence": 0.9658119678497314, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 467.56146, "r_x1": 145.7785, "r_y1": 467.56146, "r_x2": 145.7785, "r_y2": 459.4917, "r_x3": 134.76401, "r_y3": 459.4917, "coord_origin": "TOPLEFT" }, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.08871, "r_y0": 467.56146, "r_x1": 480.59006, "r_y1": 467.56146, "r_x2": 480.59006, "r_y2": 459.4917, "r_x3": 150.08871, "r_y3": 459.4917, "coord_origin": "TOPLEFT" }, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 478.52048, "r_x1": 480.59116, "r_y1": 478.52048, "r_x2": 480.59116, "r_y2": 470.45071, "r_x3": 151.51801, "r_y3": 470.45071, "coord_origin": "TOPLEFT" }, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 489.47946, "r_x1": 439.05963, "r_y1": 489.47946, "r_x2": 439.05963, "r_y2": 481.4097, "r_x3": 151.51801, "r_y3": 481.4097, "coord_origin": "TOPLEFT" }, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94202000000007, "r_y0": 489.52429, "r_x1": 480.59372, "r_y1": 489.52429, "r_x2": 480.59372, "r_y2": 482.05527, "r_x3": 442.94202000000007, "r_y3": 482.05527, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 500.48328, "r_x1": 302.11584, "r_y1": 500.48328, "r_x2": 302.11584, "r_y2": 493.01425, "r_x3": 151.51801, "r_y3": 493.01425, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "list_item", "bbox": { "l": 134.76401, "t": 503.33868, "r": 480.59286000000003, "b": 544.28545, "coord_origin": "TOPLEFT" }, "confidence": 0.972225546836853, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 511.40845, "r_x1": 146.15501, "r_y1": 511.40845, "r_x2": 146.15501, "r_y2": 503.33868, "r_x3": 134.76401, "r_y3": 503.33868, "coord_origin": "TOPLEFT" }, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.61252, "r_y0": 511.40845, "r_x1": 480.59088, "r_y1": 511.40845, "r_x2": 480.59088, "r_y2": 503.33868, "r_x3": 150.61252, "r_y3": 503.33868, "coord_origin": "TOPLEFT" }, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 522.3674599999999, "r_x1": 480.59286000000003, "r_y1": 522.3674599999999, "r_x2": 480.59286000000003, "r_y2": 514.2977000000001, "r_x3": 151.51801, "r_y3": 514.2977000000001, "coord_origin": "TOPLEFT" }, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 533.32645, "r_x1": 480.58838000000003, "r_y1": 533.32645, "r_x2": 480.58838000000003, "r_y2": 525.25668, "r_x3": 151.51801, "r_y3": 525.25668, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 544.28545, "r_x1": 199.24704, "r_y1": 544.28545, "r_x2": 199.24704, "r_y2": 536.21568, "r_x3": 151.51801, "r_y3": 536.21568, "coord_origin": "TOPLEFT" }, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 134.76401, "t": 547.18568, "r": 480.59583, "b": 610.09528, "coord_origin": "TOPLEFT" }, "confidence": 0.9674034714698792, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 555.25545, "r_x1": 146.16588, "r_y1": 555.25545, "r_x2": 146.16588, "r_y2": 547.18568, "r_x3": 134.76401, "r_y3": 547.18568, "coord_origin": "TOPLEFT" }, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.62764, "r_y0": 555.25545, "r_x1": 480.58734000000004, "r_y1": 555.25545, "r_x2": 480.58734000000004, "r_y2": 547.18568, "r_x3": 150.62764, "r_y3": 547.18568, "coord_origin": "TOPLEFT" }, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 566.2144499999999, "r_x1": 480.58838000000003, "r_y1": 566.2144499999999, "r_x2": 480.58838000000003, "r_y2": 558.14468, "r_x3": 151.51801, "r_y3": 558.14468, "coord_origin": "TOPLEFT" }, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 577.17345, "r_x1": 480.59109, "r_y1": 577.17345, "r_x2": 480.59109, "r_y2": 569.1036799999999, "r_x3": 151.51801, "r_y3": 569.1036799999999, "coord_origin": "TOPLEFT" }, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 588.1324500000001, "r_x1": 480.59195, "r_y1": 588.1324500000001, "r_x2": 480.59195, "r_y2": 580.06268, "r_x3": 151.51801, "r_y3": 580.06268, "coord_origin": "TOPLEFT" }, "text": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 599.09145, "r_x1": 200.75787, "r_y1": 599.09145, "r_x2": 200.75787, "r_y2": 591.0216800000001, "r_x3": 151.51801, "r_y3": 591.0216800000001, "coord_origin": "TOPLEFT" }, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 202.916, "r_y0": 599.1362799999999, "r_x1": 386.45911, "r_y1": 599.1362799999999, "r_x2": 386.45911, "r_y2": 591.66727, "r_x3": 202.916, "r_y3": 591.66727, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.45801, "r_y0": 599.09145, "r_x1": 389.01703, "r_y1": 599.09145, "r_x2": 389.01703, "r_y2": 591.0216800000001, "r_x3": 386.45801, "r_y3": 591.0216800000001, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.173, "r_y0": 599.1362799999999, "r_x1": 480.59583, "r_y1": 599.1362799999999, "r_x2": 480.59583, "r_y2": 591.66727, "r_x3": 391.173, "r_y3": 591.66727, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 610.09528, "r_x1": 245.63831, "r_y1": 610.09528, "r_x2": 245.63831, "r_y2": 602.62627, "r_x3": 151.51801, "r_y3": 602.62627, "coord_origin": "TOPLEFT" }, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "list_item", "bbox": { "l": 134.76401, "t": 612.95068, "r": 480.59542999999996, "b": 631.97945, "coord_origin": "TOPLEFT" }, "confidence": 0.9416429996490479, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 621.02045, "r_x1": 146.62019, "r_y1": 621.02045, "r_x2": 146.62019, "r_y2": 612.95068, "r_x3": 134.76401, "r_y3": 612.95068, "coord_origin": "TOPLEFT" }, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.25977, "r_y0": 621.02045, "r_x1": 480.59542999999996, "r_y1": 621.02045, "r_x2": 480.59542999999996, "r_y2": 612.95068, "r_x3": 151.25977, "r_y3": 612.95068, "coord_origin": "TOPLEFT" }, "text": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "orig": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 631.97945, "r_x1": 234.43031, "r_y1": 631.97945, "r_x2": 234.43031, "r_y2": 623.90968, "r_x3": 151.51801, "r_y3": 623.90968, "coord_origin": "TOPLEFT" }, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 134.76401, "t": 634.87968, "r": 480.59119, "b": 664.86745, "coord_origin": "TOPLEFT" }, "confidence": 0.9646382331848145, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 642.9494500000001, "r_x1": 146.30539, "r_y1": 642.9494500000001, "r_x2": 146.30539, "r_y2": 634.87968, "r_x3": 134.76401, "r_y3": 634.87968, "coord_origin": "TOPLEFT" }, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.82175, "r_y0": 642.9494500000001, "r_x1": 480.58731000000006, "r_y1": 642.9494500000001, "r_x2": 480.58731000000006, "r_y2": 634.87968, "r_x3": 150.82175, "r_y3": 634.87968, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 653.90845, "r_x1": 480.59119, "r_y1": 653.90845, "r_x2": 480.59119, "r_y2": 645.8386800000001, "r_x3": 151.51801, "r_y3": 645.8386800000001, "coord_origin": "TOPLEFT" }, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 664.86745, "r_x1": 299.30307, "r_y1": 664.86745, "r_x2": 299.30307, "r_y2": 656.79768, "r_x3": 151.51801, "r_y3": 656.79768, "coord_origin": "TOPLEFT" }, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 13, "page_no": 12, "cluster": { "id": 13, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9163166880607605, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 14, "page_no": 12, "cluster": { "id": 14, "label": "page_header", "bbox": { "l": 471.37561, "t": 93.77099999999996, "r": 480.5894799999999, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9061064720153809, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.37561, "r_y0": 101.84069999999997, "r_x1": 480.5894799999999, "r_y1": 101.84069999999997, "r_x2": 480.5894799999999, "r_y2": 93.77099999999996, "r_x3": 471.37561, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13" }, { "label": "list_item", "id": 5, "page_no": 12, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.371, "t": 119.67400999999995, "r": 480.59479, "b": 149.66168000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9677112698554993, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 127.74370999999985, "r_x1": 146.04857, "r_y1": 127.74370999999985, "r_x2": 146.04857, "r_y2": 119.67400999999995, "r_x3": 139.371, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.34157, "r_y0": 127.74370999999985, "r_x1": 480.58826, "r_y1": 127.74370999999985, "r_x2": 480.58826, "r_y2": 119.67400999999995, "r_x3": 150.34157, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 138.70270000000005, "r_x1": 480.59479, "r_y1": 138.70270000000005, "r_x2": 480.59479, "r_y2": 130.63300000000004, "r_x3": 151.51801, "r_y3": 130.63300000000004, "coord_origin": "TOPLEFT" }, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 149.66168000000005, "r_x1": 304.04364, "r_y1": 149.66168000000005, "r_x2": 304.04364, "r_y2": 141.59198000000004, "r_x3": 151.51801, "r_y3": 141.59198000000004, "coord_origin": "TOPLEFT" }, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content extraction from scientific tables. International Journal on Document Analysis and Recognition (IJDAR) pp. 1-10 (2022)" }, { "label": "list_item", "id": 1, "page_no": 12, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 139.371, "t": 152.56195000000002, "r": 480.59286000000003, "b": 193.50860999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.973045289516449, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 160.63165000000004, "r_x1": 145.93991, "r_y1": 160.63165000000004, "r_x2": 145.93991, "r_y2": 152.56195000000002, "r_x3": 139.371, "r_y3": 152.56195000000002, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.16298, "r_y0": 160.63165000000004, "r_x1": 480.59015, "r_y1": 160.63165000000004, "r_x2": 480.59015, "r_y2": 152.56195000000002, "r_x3": 150.16298, "r_y3": 152.56195000000002, "coord_origin": "TOPLEFT" }, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 171.59064, "r_x1": 480.5903, "r_y1": 171.59064, "r_x2": 480.5903, "r_y2": 163.52094, "r_x3": 151.51801, "r_y3": 163.52094, "coord_origin": "TOPLEFT" }, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 182.54962, "r_x1": 480.59286000000003, "r_y1": 182.54962, "r_x2": 480.59286000000003, "r_y2": 174.47992, "r_x3": 151.51801, "r_y3": 174.47992, "coord_origin": "TOPLEFT" }, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 193.50860999999998, "r_x1": 226.37399, "r_y1": 193.50860999999998, "r_x2": 226.37399, "r_y2": 185.4389, "r_x3": 151.51801, "r_y3": 185.4389, "coord_origin": "TOPLEFT" }, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC). pp. 18681873. IEEE (2022)" }, { "label": "list_item", "id": 10, "page_no": 12, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 139.371, "t": 196.40886999999998, "r": 480.59012, "b": 215.43755999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.9582491517066956, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 204.47857999999997, "r_x1": 146.31418, "r_y1": 204.47857999999997, "r_x2": 146.31418, "r_y2": 196.40886999999998, "r_x3": 139.371, "r_y3": 196.40886999999998, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.77789, "r_y0": 204.47857999999997, "r_x1": 480.59012, "r_y1": 204.47857999999997, "r_x2": 480.59012, "r_y2": 196.40886999999998, "r_x3": 150.77789, "r_y3": 196.40886999999998, "coord_origin": "TOPLEFT" }, "text": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 215.43755999999996, "r_x1": 352.01746, "r_y1": 215.43755999999996, "r_x2": 352.01746, "r_y2": 207.36785999999995, "r_x3": 151.51801, "r_y3": 207.36785999999995, "coord_origin": "TOPLEFT" }, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7. Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark dataset for table detection and recognition (2019)" }, { "label": "list_item", "id": 4, "page_no": 12, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.371, "t": 218.33887000000004, "r": 480.59473, "b": 270.28839000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.967814564704895, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 226.40857000000005, "r_x1": 146.37106, "r_y1": 226.40857000000005, "r_x2": 146.37106, "r_y2": 218.33887000000004, "r_x3": 139.371, "r_y3": 218.33887000000004, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.87132, "r_y0": 226.40857000000005, "r_x1": 480.58731000000006, "r_y1": 226.40857000000005, "r_x2": 480.58731000000006, "r_y2": 218.33887000000004, "r_x3": 150.87132, "r_y3": 218.33887000000004, "coord_origin": "TOPLEFT" }, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 237.36755000000005, "r_x1": 480.59020999999996, "r_y1": 237.36755000000005, "r_x2": 480.59020999999996, "r_y2": 229.29785000000004, "r_x3": 151.51801, "r_y3": 229.29785000000004, "coord_origin": "TOPLEFT" }, "text": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 248.32654000000002, "r_x1": 480.59473, "r_y1": 248.32654000000002, "r_x2": 480.59473, "r_y2": 240.25684, "r_x3": 151.51801, "r_y3": 240.25684, "coord_origin": "TOPLEFT" }, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 259.28552, "r_x1": 197.08617, "r_y1": 259.28552, "r_x2": 197.08617, "r_y2": 251.21582, "r_x3": 151.51801, "r_y3": 251.21582, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.40001, "r_y0": 259.07935, "r_x1": 210.00726, "r_y1": 259.07935, "r_x2": 210.00726, "r_y2": 251.15301999999997, "r_x3": 199.40001, "r_y3": 251.15301999999997, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.007, "r_y0": 259.28552, "r_x1": 332.37683, "r_y1": 259.28552, "r_x2": 332.37683, "r_y2": 251.21582, "r_x3": 210.007, "r_y3": 251.21582, "coord_origin": "TOPLEFT" }, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.69901, "r_y0": 259.33038, "r_x1": 480.59039000000007, "r_y1": 259.33038, "r_x2": 480.59039000000007, "r_y2": 251.86139000000003, "r_x3": 334.69901, "r_y3": 251.86139000000003, "coord_origin": "TOPLEFT" }, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 270.28839000000005, "r_x1": 259.75769, "r_y1": 270.28839000000005, "r_x2": 259.75769, "r_y2": 262.8194, "r_x3": 151.51801, "r_y3": 262.8194, "coord_origin": "TOPLEFT" }, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8. Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho, A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence 35 (17), 15137-15145 (May 2021), https://ojs.aaai.org/index.php/ AAAI/article/view/17777" }, { "label": "list_item", "id": 11, "page_no": 12, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 139.371, "t": 273.14484000000004, "r": 480.59387000000004, "b": 303.13254, "coord_origin": "TOPLEFT" }, "confidence": 0.9557179808616638, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 281.21457, "r_x1": 146.14218, "r_y1": 281.21457, "r_x2": 146.14218, "r_y2": 273.14484000000004, "r_x3": 139.371, "r_y3": 273.14484000000004, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.49533, "r_y0": 281.21457, "r_x1": 480.5881999999999, "r_y1": 281.21457, "r_x2": 480.5881999999999, "r_y2": 273.14484000000004, "r_x3": 150.49533, "r_y3": 273.14484000000004, "coord_origin": "TOPLEFT" }, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 292.17355, "r_x1": 480.59387000000004, "r_y1": 292.17355, "r_x2": 480.59387000000004, "r_y2": 284.10379, "r_x3": 151.51801, "r_y3": 284.10379, "coord_origin": "TOPLEFT" }, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 303.13254, "r_x1": 473.44308000000007, "r_y1": 303.13254, "r_x2": 473.44308000000007, "r_y2": 295.06277, "r_x3": 151.51801, "r_y3": 295.06277, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9. Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure understanding with transformers. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)" }, { "label": "list_item", "id": 9, "page_no": 12, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 134.76401, "t": 306.03277999999995, "r": 480.59372, "b": 368.94232, "coord_origin": "TOPLEFT" }, "confidence": 0.9639304876327515, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 314.10254000000003, "r_x1": 146.49922, "r_y1": 314.10254000000003, "r_x2": 146.49922, "r_y2": 306.03277999999995, "r_x3": 134.76401, "r_y3": 306.03277999999995, "coord_origin": "TOPLEFT" }, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.09138, "r_y0": 314.10254000000003, "r_x1": 480.58905, "r_y1": 314.10254000000003, "r_x2": 480.58905, "r_y2": 306.03277999999995, "r_x3": 151.09138, "r_y3": 306.03277999999995, "coord_origin": "TOPLEFT" }, "text": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "orig": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 325.06155, "r_x1": 480.59015, "r_y1": 325.06155, "r_x2": 480.59015, "r_y2": 316.99179, "r_x3": 151.51801, "r_y3": 316.99179, "coord_origin": "TOPLEFT" }, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 336.02054, "r_x1": 480.59113, "r_y1": 336.02054, "r_x2": 480.59113, "r_y2": 327.95078, "r_x3": 151.51801, "r_y3": 327.95078, "coord_origin": "TOPLEFT" }, "text": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 346.97952, "r_x1": 480.59113, "r_y1": 346.97952, "r_x2": 480.59113, "r_y2": 338.90976, "r_x3": 151.51801, "r_y3": 338.90976, "coord_origin": "TOPLEFT" }, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 357.93851, "r_x1": 251.14098999999996, "r_y1": 357.93851, "r_x2": 251.14098999999996, "r_y2": 349.86874, "r_x3": 151.51801, "r_y3": 349.86874, "coord_origin": "TOPLEFT" }, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.99001, "r_y0": 357.98333999999994, "r_x1": 437.53311, "r_y1": 357.98333999999994, "r_x2": 437.53311, "r_y2": 350.5143100000001, "r_x3": 253.99001, "r_y3": 350.5143100000001, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.53201, "r_y0": 357.93851, "r_x1": 440.09102999999993, "r_y1": 357.93851, "r_x2": 440.09102999999993, "r_y2": 349.86874, "r_x3": 437.53201, "r_y3": 349.86874, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94202000000007, "r_y0": 357.98333999999994, "r_x1": 480.59372, "r_y1": 357.98333999999994, "r_x2": 480.59372, "r_y2": 350.5143100000001, "r_x3": 442.94202000000007, "r_y3": 350.5143100000001, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 368.94232, "r_x1": 297.40939, "r_y1": 368.94232, "r_x2": 297.40939, "r_y2": 361.47329999999994, "r_x3": 151.51801, "r_y3": 361.47329999999994, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10. Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A large human-annotated dataset for document-layout segmentation. In: Zhang, A., Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp. 3743-3751. ACM (2022). https://doi.org/10.1145/3534678.3539043 , https:// doi.org/10.1145/3534678.3539043" }, { "label": "list_item", "id": 0, "page_no": 12, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 134.76401, "t": 371.79773, "r": 480.59296, "b": 412.74448, "coord_origin": "TOPLEFT" }, "confidence": 0.9752162098884583, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 379.86749, "r_x1": 146.03854, "r_y1": 379.86749, "r_x2": 146.03854, "r_y2": 371.79773, "r_x3": 134.76401, "r_y3": 371.79773, "coord_origin": "TOPLEFT" }, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.4505, "r_y0": 379.86749, "r_x1": 480.58914000000004, "r_y1": 379.86749, "r_x2": 480.58914000000004, "r_y2": 371.79773, "r_x3": 150.4505, "r_y3": 371.79773, "coord_origin": "TOPLEFT" }, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 390.82651, "r_x1": 480.59296, "r_y1": 390.82651, "r_x2": 480.59296, "r_y2": 382.7567399999999, "r_x3": 151.51801, "r_y3": 382.7567399999999, "coord_origin": "TOPLEFT" }, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 401.78549, "r_x1": 480.59293, "r_y1": 401.78549, "r_x2": 480.59293, "r_y2": 393.71573, "r_x3": 151.51801, "r_y3": 393.71573, "coord_origin": "TOPLEFT" }, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 412.74448, "r_x1": 373.82727, "r_y1": 412.74448, "r_x2": 373.82727, "r_y2": 404.67471, "r_x3": 151.51801, "r_y3": 404.67471, "coord_origin": "TOPLEFT" }, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11. Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet: An approach for end to end table detection and structure recognition from imagebased documents. In: Proceedings of the IEEE/CVF conference on computer vision and pattern recognition workshops. pp. 572-573 (2020)" }, { "label": "list_item", "id": 3, "page_no": 12, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 134.76401, "t": 415.64471, "r": 480.59469999999993, "b": 456.59146, "coord_origin": "TOPLEFT" }, "confidence": 0.9707236886024475, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 423.71448000000004, "r_x1": 145.91106, "r_y1": 423.71448000000004, "r_x2": 145.91106, "r_y2": 415.64471, "r_x3": 134.76401, "r_y3": 415.64471, "coord_origin": "TOPLEFT" }, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.27309, "r_y0": 423.71448000000004, "r_x1": 480.5874, "r_y1": 423.71448000000004, "r_x2": 480.5874, "r_y2": 415.64471, "r_x3": 150.27309, "r_y3": 415.64471, "coord_origin": "TOPLEFT" }, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 434.67349, "r_x1": 480.59469999999993, "r_y1": 434.67349, "r_x2": 480.59469999999993, "r_y2": 426.60373, "r_x3": 151.51801, "r_y3": 426.60373, "coord_origin": "TOPLEFT" }, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 445.63248, "r_x1": 480.58844, "r_y1": 445.63248, "r_x2": 480.58844, "r_y2": 437.5627099999999, "r_x3": 151.51801, "r_y3": 437.5627099999999, "coord_origin": "TOPLEFT" }, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 456.59146, "r_x1": 292.91455, "r_y1": 456.59146, "r_x2": 292.91455, "r_y2": 448.5217, "r_x3": 151.51801, "r_y3": 448.5217, "coord_origin": "TOPLEFT" }, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12. Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In: 2017 14th IAPR international conference on document analysis and recognition (ICDAR). vol. 1, pp. 1162-1167. IEEE (2017)" }, { "label": "list_item", "id": 7, "page_no": 12, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 134.76401, "t": 459.4917, "r": 480.59372, "b": 500.48328, "coord_origin": "TOPLEFT" }, "confidence": 0.9658119678497314, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 467.56146, "r_x1": 145.7785, "r_y1": 467.56146, "r_x2": 145.7785, "r_y2": 459.4917, "r_x3": 134.76401, "r_y3": 459.4917, "coord_origin": "TOPLEFT" }, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.08871, "r_y0": 467.56146, "r_x1": 480.59006, "r_y1": 467.56146, "r_x2": 480.59006, "r_y2": 459.4917, "r_x3": 150.08871, "r_y3": 459.4917, "coord_origin": "TOPLEFT" }, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 478.52048, "r_x1": 480.59116, "r_y1": 478.52048, "r_x2": 480.59116, "r_y2": 470.45071, "r_x3": 151.51801, "r_y3": 470.45071, "coord_origin": "TOPLEFT" }, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 489.47946, "r_x1": 439.05963, "r_y1": 489.47946, "r_x2": 439.05963, "r_y2": 481.4097, "r_x3": 151.51801, "r_y3": 481.4097, "coord_origin": "TOPLEFT" }, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94202000000007, "r_y0": 489.52429, "r_x1": 480.59372, "r_y1": 489.52429, "r_x2": 480.59372, "r_y2": 482.05527, "r_x3": 442.94202000000007, "r_y3": 482.05527, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 500.48328, "r_x1": 302.11584, "r_y1": 500.48328, "r_x2": 302.11584, "r_y2": 493.01425, "r_x3": 151.51801, "r_y3": 493.01425, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13. Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep learning based table structure recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019). https:// doi.org/10.1109/ICDAR.2019.00226" }, { "label": "list_item", "id": 2, "page_no": 12, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 134.76401, "t": 503.33868, "r": 480.59286000000003, "b": 544.28545, "coord_origin": "TOPLEFT" }, "confidence": 0.972225546836853, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 511.40845, "r_x1": 146.15501, "r_y1": 511.40845, "r_x2": 146.15501, "r_y2": 503.33868, "r_x3": 134.76401, "r_y3": 503.33868, "coord_origin": "TOPLEFT" }, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.61252, "r_y0": 511.40845, "r_x1": 480.59088, "r_y1": 511.40845, "r_x2": 480.59088, "r_y2": 503.33868, "r_x3": 150.61252, "r_y3": 503.33868, "coord_origin": "TOPLEFT" }, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 522.3674599999999, "r_x1": 480.59286000000003, "r_y1": 522.3674599999999, "r_x2": 480.59286000000003, "r_y2": 514.2977000000001, "r_x3": 151.51801, "r_y3": 514.2977000000001, "coord_origin": "TOPLEFT" }, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 533.32645, "r_x1": 480.58838000000003, "r_y1": 533.32645, "r_x2": 480.58838000000003, "r_y2": 525.25668, "r_x3": 151.51801, "r_y3": 525.25668, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 544.28545, "r_x1": 199.24704, "r_y1": 544.28545, "r_x2": 199.24704, "r_y2": 536.21568, "r_x3": 151.51801, "r_y3": 536.21568, "coord_origin": "TOPLEFT" }, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14. Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive table extraction from unstructured documents. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642 (June 2022)" }, { "label": "list_item", "id": 6, "page_no": 12, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 134.76401, "t": 547.18568, "r": 480.59583, "b": 610.09528, "coord_origin": "TOPLEFT" }, "confidence": 0.9674034714698792, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 555.25545, "r_x1": 146.16588, "r_y1": 555.25545, "r_x2": 146.16588, "r_y2": 547.18568, "r_x3": 134.76401, "r_y3": 547.18568, "coord_origin": "TOPLEFT" }, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.62764, "r_y0": 555.25545, "r_x1": 480.58734000000004, "r_y1": 555.25545, "r_x2": 480.58734000000004, "r_y2": 547.18568, "r_x3": 150.62764, "r_y3": 547.18568, "coord_origin": "TOPLEFT" }, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 566.2144499999999, "r_x1": 480.58838000000003, "r_y1": 566.2144499999999, "r_x2": 480.58838000000003, "r_y2": 558.14468, "r_x3": 151.51801, "r_y3": 558.14468, "coord_origin": "TOPLEFT" }, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 577.17345, "r_x1": 480.59109, "r_y1": 577.17345, "r_x2": 480.59109, "r_y2": 569.1036799999999, "r_x3": 151.51801, "r_y3": 569.1036799999999, "coord_origin": "TOPLEFT" }, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 588.1324500000001, "r_x1": 480.59195, "r_y1": 588.1324500000001, "r_x2": 480.59195, "r_y2": 580.06268, "r_x3": 151.51801, "r_y3": 580.06268, "coord_origin": "TOPLEFT" }, "text": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 599.09145, "r_x1": 200.75787, "r_y1": 599.09145, "r_x2": 200.75787, "r_y2": 591.0216800000001, "r_x3": 151.51801, "r_y3": 591.0216800000001, "coord_origin": "TOPLEFT" }, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 202.916, "r_y0": 599.1362799999999, "r_x1": 386.45911, "r_y1": 599.1362799999999, "r_x2": 386.45911, "r_y2": 591.66727, "r_x3": 202.916, "r_y3": 591.66727, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.45801, "r_y0": 599.09145, "r_x1": 389.01703, "r_y1": 599.09145, "r_x2": 389.01703, "r_y2": 591.0216800000001, "r_x3": 386.45801, "r_y3": 591.0216800000001, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.173, "r_y0": 599.1362799999999, "r_x1": 480.59583, "r_y1": 599.1362799999999, "r_x2": 480.59583, "r_y2": 591.66727, "r_x3": 391.173, "r_y3": 591.66727, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 610.09528, "r_x1": 245.63831, "r_y1": 610.09528, "r_x2": 245.63831, "r_y2": 602.62627, "r_x3": 151.51801, "r_y3": 602.62627, "coord_origin": "TOPLEFT" }, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "15. Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A machine learning platform to ingest documents at scale. In: Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY, USA (2018). https://doi.org/10.1145/3219819.3219834 , https://doi.org/10. 1145/3219819.3219834" }, { "label": "list_item", "id": 12, "page_no": 12, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 134.76401, "t": 612.95068, "r": 480.59542999999996, "b": 631.97945, "coord_origin": "TOPLEFT" }, "confidence": 0.9416429996490479, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 621.02045, "r_x1": 146.62019, "r_y1": 621.02045, "r_x2": 146.62019, "r_y2": 612.95068, "r_x3": 134.76401, "r_y3": 612.95068, "coord_origin": "TOPLEFT" }, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.25977, "r_y0": 621.02045, "r_x1": 480.59542999999996, "r_y1": 621.02045, "r_x2": 480.59542999999996, "r_y2": 612.95068, "r_x3": 151.25977, "r_y3": 612.95068, "coord_origin": "TOPLEFT" }, "text": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "orig": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 631.97945, "r_x1": 234.43031, "r_y1": 631.97945, "r_x2": 234.43031, "r_y2": 623.90968, "r_x3": 151.51801, "r_y3": 623.90968, "coord_origin": "TOPLEFT" }, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "16. Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN (1996), aAINN09397" }, { "label": "list_item", "id": 8, "page_no": 12, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 134.76401, "t": 634.87968, "r": 480.59119, "b": 664.86745, "coord_origin": "TOPLEFT" }, "confidence": 0.9646382331848145, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 642.9494500000001, "r_x1": 146.30539, "r_y1": 642.9494500000001, "r_x2": 146.30539, "r_y2": 634.87968, "r_x3": 134.76401, "r_y3": 634.87968, "coord_origin": "TOPLEFT" }, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.82175, "r_y0": 642.9494500000001, "r_x1": 480.58731000000006, "r_y1": 642.9494500000001, "r_x2": 480.58731000000006, "r_y2": 634.87968, "r_x3": 150.82175, "r_y3": 634.87968, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 653.90845, "r_x1": 480.59119, "r_y1": 653.90845, "r_x2": 480.59119, "r_y2": 645.8386800000001, "r_x3": 151.51801, "r_y3": 645.8386800000001, "coord_origin": "TOPLEFT" }, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 664.86745, "r_x1": 299.30307, "r_y1": 664.86745, "r_x2": 299.30307, "r_y2": 656.79768, "r_x3": 151.51801, "r_y3": 656.79768, "coord_origin": "TOPLEFT" }, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "17. Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table images. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 749-755. IEEE (2019)" } ], "body": [ { "label": "list_item", "id": 5, "page_no": 12, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.371, "t": 119.67400999999995, "r": 480.59479, "b": 149.66168000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9677112698554993, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 127.74370999999985, "r_x1": 146.04857, "r_y1": 127.74370999999985, "r_x2": 146.04857, "r_y2": 119.67400999999995, "r_x3": 139.371, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.34157, "r_y0": 127.74370999999985, "r_x1": 480.58826, "r_y1": 127.74370999999985, "r_x2": 480.58826, "r_y2": 119.67400999999995, "r_x3": 150.34157, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 138.70270000000005, "r_x1": 480.59479, "r_y1": 138.70270000000005, "r_x2": 480.59479, "r_y2": 130.63300000000004, "r_x3": 151.51801, "r_y3": 130.63300000000004, "coord_origin": "TOPLEFT" }, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 149.66168000000005, "r_x1": 304.04364, "r_y1": 149.66168000000005, "r_x2": 304.04364, "r_y2": 141.59198000000004, "r_x3": 151.51801, "r_y3": 141.59198000000004, "coord_origin": "TOPLEFT" }, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content extraction from scientific tables. International Journal on Document Analysis and Recognition (IJDAR) pp. 1-10 (2022)" }, { "label": "list_item", "id": 1, "page_no": 12, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 139.371, "t": 152.56195000000002, "r": 480.59286000000003, "b": 193.50860999999998, "coord_origin": "TOPLEFT" }, "confidence": 0.973045289516449, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 160.63165000000004, "r_x1": 145.93991, "r_y1": 160.63165000000004, "r_x2": 145.93991, "r_y2": 152.56195000000002, "r_x3": 139.371, "r_y3": 152.56195000000002, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.16298, "r_y0": 160.63165000000004, "r_x1": 480.59015, "r_y1": 160.63165000000004, "r_x2": 480.59015, "r_y2": 152.56195000000002, "r_x3": 150.16298, "r_y3": 152.56195000000002, "coord_origin": "TOPLEFT" }, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 171.59064, "r_x1": 480.5903, "r_y1": 171.59064, "r_x2": 480.5903, "r_y2": 163.52094, "r_x3": 151.51801, "r_y3": 163.52094, "coord_origin": "TOPLEFT" }, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 182.54962, "r_x1": 480.59286000000003, "r_y1": 182.54962, "r_x2": 480.59286000000003, "r_y2": 174.47992, "r_x3": 151.51801, "r_y3": 174.47992, "coord_origin": "TOPLEFT" }, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 193.50860999999998, "r_x1": 226.37399, "r_y1": 193.50860999999998, "r_x2": 226.37399, "r_y2": 185.4389, "r_x3": 151.51801, "r_y3": 185.4389, "coord_origin": "TOPLEFT" }, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC). pp. 18681873. IEEE (2022)" }, { "label": "list_item", "id": 10, "page_no": 12, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 139.371, "t": 196.40886999999998, "r": 480.59012, "b": 215.43755999999996, "coord_origin": "TOPLEFT" }, "confidence": 0.9582491517066956, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 204.47857999999997, "r_x1": 146.31418, "r_y1": 204.47857999999997, "r_x2": 146.31418, "r_y2": 196.40886999999998, "r_x3": 139.371, "r_y3": 196.40886999999998, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.77789, "r_y0": 204.47857999999997, "r_x1": 480.59012, "r_y1": 204.47857999999997, "r_x2": 480.59012, "r_y2": 196.40886999999998, "r_x3": 150.77789, "r_y3": 196.40886999999998, "coord_origin": "TOPLEFT" }, "text": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 215.43755999999996, "r_x1": 352.01746, "r_y1": 215.43755999999996, "r_x2": 352.01746, "r_y2": 207.36785999999995, "r_x3": 151.51801, "r_y3": 207.36785999999995, "coord_origin": "TOPLEFT" }, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7. Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark dataset for table detection and recognition (2019)" }, { "label": "list_item", "id": 4, "page_no": 12, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.371, "t": 218.33887000000004, "r": 480.59473, "b": 270.28839000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.967814564704895, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 226.40857000000005, "r_x1": 146.37106, "r_y1": 226.40857000000005, "r_x2": 146.37106, "r_y2": 218.33887000000004, "r_x3": 139.371, "r_y3": 218.33887000000004, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.87132, "r_y0": 226.40857000000005, "r_x1": 480.58731000000006, "r_y1": 226.40857000000005, "r_x2": 480.58731000000006, "r_y2": 218.33887000000004, "r_x3": 150.87132, "r_y3": 218.33887000000004, "coord_origin": "TOPLEFT" }, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 237.36755000000005, "r_x1": 480.59020999999996, "r_y1": 237.36755000000005, "r_x2": 480.59020999999996, "r_y2": 229.29785000000004, "r_x3": 151.51801, "r_y3": 229.29785000000004, "coord_origin": "TOPLEFT" }, "text": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 248.32654000000002, "r_x1": 480.59473, "r_y1": 248.32654000000002, "r_x2": 480.59473, "r_y2": 240.25684, "r_x3": 151.51801, "r_y3": 240.25684, "coord_origin": "TOPLEFT" }, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 259.28552, "r_x1": 197.08617, "r_y1": 259.28552, "r_x2": 197.08617, "r_y2": 251.21582, "r_x3": 151.51801, "r_y3": 251.21582, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.40001, "r_y0": 259.07935, "r_x1": 210.00726, "r_y1": 259.07935, "r_x2": 210.00726, "r_y2": 251.15301999999997, "r_x3": 199.40001, "r_y3": 251.15301999999997, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.007, "r_y0": 259.28552, "r_x1": 332.37683, "r_y1": 259.28552, "r_x2": 332.37683, "r_y2": 251.21582, "r_x3": 210.007, "r_y3": 251.21582, "coord_origin": "TOPLEFT" }, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.69901, "r_y0": 259.33038, "r_x1": 480.59039000000007, "r_y1": 259.33038, "r_x2": 480.59039000000007, "r_y2": 251.86139000000003, "r_x3": 334.69901, "r_y3": 251.86139000000003, "coord_origin": "TOPLEFT" }, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 270.28839000000005, "r_x1": 259.75769, "r_y1": 270.28839000000005, "r_x2": 259.75769, "r_y2": 262.8194, "r_x3": 151.51801, "r_y3": 262.8194, "coord_origin": "TOPLEFT" }, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8. Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho, A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence 35 (17), 15137-15145 (May 2021), https://ojs.aaai.org/index.php/ AAAI/article/view/17777" }, { "label": "list_item", "id": 11, "page_no": 12, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 139.371, "t": 273.14484000000004, "r": 480.59387000000004, "b": 303.13254, "coord_origin": "TOPLEFT" }, "confidence": 0.9557179808616638, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.371, "r_y0": 281.21457, "r_x1": 146.14218, "r_y1": 281.21457, "r_x2": 146.14218, "r_y2": 273.14484000000004, "r_x3": 139.371, "r_y3": 273.14484000000004, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.49533, "r_y0": 281.21457, "r_x1": 480.5881999999999, "r_y1": 281.21457, "r_x2": 480.5881999999999, "r_y2": 273.14484000000004, "r_x3": 150.49533, "r_y3": 273.14484000000004, "coord_origin": "TOPLEFT" }, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 292.17355, "r_x1": 480.59387000000004, "r_y1": 292.17355, "r_x2": 480.59387000000004, "r_y2": 284.10379, "r_x3": 151.51801, "r_y3": 284.10379, "coord_origin": "TOPLEFT" }, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 303.13254, "r_x1": 473.44308000000007, "r_y1": 303.13254, "r_x2": 473.44308000000007, "r_y2": 295.06277, "r_x3": 151.51801, "r_y3": 295.06277, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9. Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure understanding with transformers. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)" }, { "label": "list_item", "id": 9, "page_no": 12, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 134.76401, "t": 306.03277999999995, "r": 480.59372, "b": 368.94232, "coord_origin": "TOPLEFT" }, "confidence": 0.9639304876327515, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 314.10254000000003, "r_x1": 146.49922, "r_y1": 314.10254000000003, "r_x2": 146.49922, "r_y2": 306.03277999999995, "r_x3": 134.76401, "r_y3": 306.03277999999995, "coord_origin": "TOPLEFT" }, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.09138, "r_y0": 314.10254000000003, "r_x1": 480.58905, "r_y1": 314.10254000000003, "r_x2": 480.58905, "r_y2": 306.03277999999995, "r_x3": 151.09138, "r_y3": 306.03277999999995, "coord_origin": "TOPLEFT" }, "text": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "orig": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 325.06155, "r_x1": 480.59015, "r_y1": 325.06155, "r_x2": 480.59015, "r_y2": 316.99179, "r_x3": 151.51801, "r_y3": 316.99179, "coord_origin": "TOPLEFT" }, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 336.02054, "r_x1": 480.59113, "r_y1": 336.02054, "r_x2": 480.59113, "r_y2": 327.95078, "r_x3": 151.51801, "r_y3": 327.95078, "coord_origin": "TOPLEFT" }, "text": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 346.97952, "r_x1": 480.59113, "r_y1": 346.97952, "r_x2": 480.59113, "r_y2": 338.90976, "r_x3": 151.51801, "r_y3": 338.90976, "coord_origin": "TOPLEFT" }, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 357.93851, "r_x1": 251.14098999999996, "r_y1": 357.93851, "r_x2": 251.14098999999996, "r_y2": 349.86874, "r_x3": 151.51801, "r_y3": 349.86874, "coord_origin": "TOPLEFT" }, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.99001, "r_y0": 357.98333999999994, "r_x1": 437.53311, "r_y1": 357.98333999999994, "r_x2": 437.53311, "r_y2": 350.5143100000001, "r_x3": 253.99001, "r_y3": 350.5143100000001, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.53201, "r_y0": 357.93851, "r_x1": 440.09102999999993, "r_y1": 357.93851, "r_x2": 440.09102999999993, "r_y2": 349.86874, "r_x3": 437.53201, "r_y3": 349.86874, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94202000000007, "r_y0": 357.98333999999994, "r_x1": 480.59372, "r_y1": 357.98333999999994, "r_x2": 480.59372, "r_y2": 350.5143100000001, "r_x3": 442.94202000000007, "r_y3": 350.5143100000001, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 368.94232, "r_x1": 297.40939, "r_y1": 368.94232, "r_x2": 297.40939, "r_y2": 361.47329999999994, "r_x3": 151.51801, "r_y3": 361.47329999999994, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10. Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A large human-annotated dataset for document-layout segmentation. In: Zhang, A., Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp. 3743-3751. ACM (2022). https://doi.org/10.1145/3534678.3539043 , https:// doi.org/10.1145/3534678.3539043" }, { "label": "list_item", "id": 0, "page_no": 12, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 134.76401, "t": 371.79773, "r": 480.59296, "b": 412.74448, "coord_origin": "TOPLEFT" }, "confidence": 0.9752162098884583, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 379.86749, "r_x1": 146.03854, "r_y1": 379.86749, "r_x2": 146.03854, "r_y2": 371.79773, "r_x3": 134.76401, "r_y3": 371.79773, "coord_origin": "TOPLEFT" }, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.4505, "r_y0": 379.86749, "r_x1": 480.58914000000004, "r_y1": 379.86749, "r_x2": 480.58914000000004, "r_y2": 371.79773, "r_x3": 150.4505, "r_y3": 371.79773, "coord_origin": "TOPLEFT" }, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 390.82651, "r_x1": 480.59296, "r_y1": 390.82651, "r_x2": 480.59296, "r_y2": 382.7567399999999, "r_x3": 151.51801, "r_y3": 382.7567399999999, "coord_origin": "TOPLEFT" }, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 401.78549, "r_x1": 480.59293, "r_y1": 401.78549, "r_x2": 480.59293, "r_y2": 393.71573, "r_x3": 151.51801, "r_y3": 393.71573, "coord_origin": "TOPLEFT" }, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 412.74448, "r_x1": 373.82727, "r_y1": 412.74448, "r_x2": 373.82727, "r_y2": 404.67471, "r_x3": 151.51801, "r_y3": 404.67471, "coord_origin": "TOPLEFT" }, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11. Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet: An approach for end to end table detection and structure recognition from imagebased documents. In: Proceedings of the IEEE/CVF conference on computer vision and pattern recognition workshops. pp. 572-573 (2020)" }, { "label": "list_item", "id": 3, "page_no": 12, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 134.76401, "t": 415.64471, "r": 480.59469999999993, "b": 456.59146, "coord_origin": "TOPLEFT" }, "confidence": 0.9707236886024475, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 423.71448000000004, "r_x1": 145.91106, "r_y1": 423.71448000000004, "r_x2": 145.91106, "r_y2": 415.64471, "r_x3": 134.76401, "r_y3": 415.64471, "coord_origin": "TOPLEFT" }, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.27309, "r_y0": 423.71448000000004, "r_x1": 480.5874, "r_y1": 423.71448000000004, "r_x2": 480.5874, "r_y2": 415.64471, "r_x3": 150.27309, "r_y3": 415.64471, "coord_origin": "TOPLEFT" }, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 434.67349, "r_x1": 480.59469999999993, "r_y1": 434.67349, "r_x2": 480.59469999999993, "r_y2": 426.60373, "r_x3": 151.51801, "r_y3": 426.60373, "coord_origin": "TOPLEFT" }, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 445.63248, "r_x1": 480.58844, "r_y1": 445.63248, "r_x2": 480.58844, "r_y2": 437.5627099999999, "r_x3": 151.51801, "r_y3": 437.5627099999999, "coord_origin": "TOPLEFT" }, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 456.59146, "r_x1": 292.91455, "r_y1": 456.59146, "r_x2": 292.91455, "r_y2": 448.5217, "r_x3": 151.51801, "r_y3": 448.5217, "coord_origin": "TOPLEFT" }, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12. Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In: 2017 14th IAPR international conference on document analysis and recognition (ICDAR). vol. 1, pp. 1162-1167. IEEE (2017)" }, { "label": "list_item", "id": 7, "page_no": 12, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 134.76401, "t": 459.4917, "r": 480.59372, "b": 500.48328, "coord_origin": "TOPLEFT" }, "confidence": 0.9658119678497314, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 467.56146, "r_x1": 145.7785, "r_y1": 467.56146, "r_x2": 145.7785, "r_y2": 459.4917, "r_x3": 134.76401, "r_y3": 459.4917, "coord_origin": "TOPLEFT" }, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.08871, "r_y0": 467.56146, "r_x1": 480.59006, "r_y1": 467.56146, "r_x2": 480.59006, "r_y2": 459.4917, "r_x3": 150.08871, "r_y3": 459.4917, "coord_origin": "TOPLEFT" }, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 478.52048, "r_x1": 480.59116, "r_y1": 478.52048, "r_x2": 480.59116, "r_y2": 470.45071, "r_x3": 151.51801, "r_y3": 470.45071, "coord_origin": "TOPLEFT" }, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 489.47946, "r_x1": 439.05963, "r_y1": 489.47946, "r_x2": 439.05963, "r_y2": 481.4097, "r_x3": 151.51801, "r_y3": 481.4097, "coord_origin": "TOPLEFT" }, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94202000000007, "r_y0": 489.52429, "r_x1": 480.59372, "r_y1": 489.52429, "r_x2": 480.59372, "r_y2": 482.05527, "r_x3": 442.94202000000007, "r_y3": 482.05527, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 500.48328, "r_x1": 302.11584, "r_y1": 500.48328, "r_x2": 302.11584, "r_y2": 493.01425, "r_x3": 151.51801, "r_y3": 493.01425, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13. Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep learning based table structure recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019). https:// doi.org/10.1109/ICDAR.2019.00226" }, { "label": "list_item", "id": 2, "page_no": 12, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 134.76401, "t": 503.33868, "r": 480.59286000000003, "b": 544.28545, "coord_origin": "TOPLEFT" }, "confidence": 0.972225546836853, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 511.40845, "r_x1": 146.15501, "r_y1": 511.40845, "r_x2": 146.15501, "r_y2": 503.33868, "r_x3": 134.76401, "r_y3": 503.33868, "coord_origin": "TOPLEFT" }, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.61252, "r_y0": 511.40845, "r_x1": 480.59088, "r_y1": 511.40845, "r_x2": 480.59088, "r_y2": 503.33868, "r_x3": 150.61252, "r_y3": 503.33868, "coord_origin": "TOPLEFT" }, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 522.3674599999999, "r_x1": 480.59286000000003, "r_y1": 522.3674599999999, "r_x2": 480.59286000000003, "r_y2": 514.2977000000001, "r_x3": 151.51801, "r_y3": 514.2977000000001, "coord_origin": "TOPLEFT" }, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 533.32645, "r_x1": 480.58838000000003, "r_y1": 533.32645, "r_x2": 480.58838000000003, "r_y2": 525.25668, "r_x3": 151.51801, "r_y3": 525.25668, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 544.28545, "r_x1": 199.24704, "r_y1": 544.28545, "r_x2": 199.24704, "r_y2": 536.21568, "r_x3": 151.51801, "r_y3": 536.21568, "coord_origin": "TOPLEFT" }, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14. Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive table extraction from unstructured documents. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642 (June 2022)" }, { "label": "list_item", "id": 6, "page_no": 12, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 134.76401, "t": 547.18568, "r": 480.59583, "b": 610.09528, "coord_origin": "TOPLEFT" }, "confidence": 0.9674034714698792, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 555.25545, "r_x1": 146.16588, "r_y1": 555.25545, "r_x2": 146.16588, "r_y2": 547.18568, "r_x3": 134.76401, "r_y3": 547.18568, "coord_origin": "TOPLEFT" }, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.62764, "r_y0": 555.25545, "r_x1": 480.58734000000004, "r_y1": 555.25545, "r_x2": 480.58734000000004, "r_y2": 547.18568, "r_x3": 150.62764, "r_y3": 547.18568, "coord_origin": "TOPLEFT" }, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 566.2144499999999, "r_x1": 480.58838000000003, "r_y1": 566.2144499999999, "r_x2": 480.58838000000003, "r_y2": 558.14468, "r_x3": 151.51801, "r_y3": 558.14468, "coord_origin": "TOPLEFT" }, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 577.17345, "r_x1": 480.59109, "r_y1": 577.17345, "r_x2": 480.59109, "r_y2": 569.1036799999999, "r_x3": 151.51801, "r_y3": 569.1036799999999, "coord_origin": "TOPLEFT" }, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 588.1324500000001, "r_x1": 480.59195, "r_y1": 588.1324500000001, "r_x2": 480.59195, "r_y2": 580.06268, "r_x3": 151.51801, "r_y3": 580.06268, "coord_origin": "TOPLEFT" }, "text": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 599.09145, "r_x1": 200.75787, "r_y1": 599.09145, "r_x2": 200.75787, "r_y2": 591.0216800000001, "r_x3": 151.51801, "r_y3": 591.0216800000001, "coord_origin": "TOPLEFT" }, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 202.916, "r_y0": 599.1362799999999, "r_x1": 386.45911, "r_y1": 599.1362799999999, "r_x2": 386.45911, "r_y2": 591.66727, "r_x3": 202.916, "r_y3": 591.66727, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.45801, "r_y0": 599.09145, "r_x1": 389.01703, "r_y1": 599.09145, "r_x2": 389.01703, "r_y2": 591.0216800000001, "r_x3": 386.45801, "r_y3": 591.0216800000001, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.173, "r_y0": 599.1362799999999, "r_x1": 480.59583, "r_y1": 599.1362799999999, "r_x2": 480.59583, "r_y2": 591.66727, "r_x3": 391.173, "r_y3": 591.66727, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 610.09528, "r_x1": 245.63831, "r_y1": 610.09528, "r_x2": 245.63831, "r_y2": 602.62627, "r_x3": 151.51801, "r_y3": 602.62627, "coord_origin": "TOPLEFT" }, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "15. Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A machine learning platform to ingest documents at scale. In: Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY, USA (2018). https://doi.org/10.1145/3219819.3219834 , https://doi.org/10. 1145/3219819.3219834" }, { "label": "list_item", "id": 12, "page_no": 12, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 134.76401, "t": 612.95068, "r": 480.59542999999996, "b": 631.97945, "coord_origin": "TOPLEFT" }, "confidence": 0.9416429996490479, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 621.02045, "r_x1": 146.62019, "r_y1": 621.02045, "r_x2": 146.62019, "r_y2": 612.95068, "r_x3": 134.76401, "r_y3": 612.95068, "coord_origin": "TOPLEFT" }, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.25977, "r_y0": 621.02045, "r_x1": 480.59542999999996, "r_y1": 621.02045, "r_x2": 480.59542999999996, "r_y2": 612.95068, "r_x3": 151.25977, "r_y3": 612.95068, "coord_origin": "TOPLEFT" }, "text": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "orig": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 631.97945, "r_x1": 234.43031, "r_y1": 631.97945, "r_x2": 234.43031, "r_y2": 623.90968, "r_x3": 151.51801, "r_y3": 623.90968, "coord_origin": "TOPLEFT" }, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "16. Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN (1996), aAINN09397" }, { "label": "list_item", "id": 8, "page_no": 12, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 134.76401, "t": 634.87968, "r": 480.59119, "b": 664.86745, "coord_origin": "TOPLEFT" }, "confidence": 0.9646382331848145, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76401, "r_y0": 642.9494500000001, "r_x1": 146.30539, "r_y1": 642.9494500000001, "r_x2": 146.30539, "r_y2": 634.87968, "r_x3": 134.76401, "r_y3": 634.87968, "coord_origin": "TOPLEFT" }, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.82175, "r_y0": 642.9494500000001, "r_x1": 480.58731000000006, "r_y1": 642.9494500000001, "r_x2": 480.58731000000006, "r_y2": 634.87968, "r_x3": 150.82175, "r_y3": 634.87968, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 653.90845, "r_x1": 480.59119, "r_y1": 653.90845, "r_x2": 480.59119, "r_y2": 645.8386800000001, "r_x3": 151.51801, "r_y3": 645.8386800000001, "coord_origin": "TOPLEFT" }, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 664.86745, "r_x1": 299.30307, "r_y1": 664.86745, "r_x2": 299.30307, "r_y2": 656.79768, "r_x3": 151.51801, "r_y3": 656.79768, "coord_origin": "TOPLEFT" }, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "17. Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table images. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 749-755. IEEE (2019)" } ], "headers": [ { "label": "page_header", "id": 13, "page_no": 12, "cluster": { "id": 13, "label": "page_header", "bbox": { "l": 194.478, "t": 93.77099999999996, "r": 447.54291000000006, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9163166880607605, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.478, "r_y0": 101.84069999999997, "r_x1": 447.54291000000006, "r_y1": 101.84069999999997, "r_x2": 447.54291000000006, "r_y2": 93.77099999999996, "r_x3": 194.478, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 14, "page_no": 12, "cluster": { "id": 14, "label": "page_header", "bbox": { "l": 471.37561, "t": 93.77099999999996, "r": 480.5894799999999, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.9061064720153809, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.37561, "r_y0": 101.84069999999997, "r_x1": 480.5894799999999, "r_y1": 101.84069999999997, "r_x2": 480.5894799999999, "r_y2": 93.77099999999996, "r_x3": 471.37561, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13" } ] } }, { "page_no": 13, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 143.97887, "r_y1": 101.84069999999997, "r_x2": 143.97887, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82053, "r_y0": 101.84069999999997, "r_x1": 178.08249, "r_y1": 101.84069999999997, "r_x2": 178.08249, "r_y2": 93.77099999999996, "r_x3": 167.82053, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37929, "r_y0": 101.84069999999997, "r_x1": 231.72049000000004, "r_y1": 101.84069999999997, "r_x2": 231.72049000000004, "r_y2": 93.77099999999996, "r_x3": 182.37929, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.74370999999985, "r_x1": 146.07936, "r_y1": 127.74370999999985, "r_x2": 146.07936, "r_y2": 119.67400999999995, "r_x3": 134.765, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5069, "r_y0": 127.74370999999985, "r_x1": 480.5892, "r_y1": 127.74370999999985, "r_x2": 480.5892, "r_y2": 119.67400999999995, "r_x3": 150.5069, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 138.70270000000005, "r_x1": 480.59113, "r_y1": 138.70270000000005, "r_x2": 480.59113, "r_y2": 130.63300000000004, "r_x3": 151.51801, "r_y3": 130.63300000000004, "coord_origin": "TOPLEFT" }, "text": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "orig": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 149.66168000000005, "r_x1": 427.53329, "r_y1": 149.66168000000005, "r_x2": 427.53329, "r_y2": 141.59198000000004, "r_x3": 151.51801, "r_y3": 141.59198000000004, "coord_origin": "TOPLEFT" }, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 160.62067000000002, "r_x1": 146.19109, "r_y1": 160.62067000000002, "r_x2": 146.19109, "r_y2": 152.55096000000003, "r_x3": 134.765, "r_y3": 152.55096000000003, "coord_origin": "TOPLEFT" }, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.66234, "r_y0": 160.62067000000002, "r_x1": 480.5936899999999, "r_y1": 160.62067000000002, "r_x2": 480.5936899999999, "r_y2": 152.55096000000003, "r_x3": 150.66234, "r_y3": 152.55096000000003, "coord_origin": "TOPLEFT" }, "text": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "orig": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 171.57965000000002, "r_x1": 480.59469999999993, "r_y1": 171.57965000000002, "r_x2": 480.59469999999993, "r_y2": 163.50995, "r_x3": 151.51801, "r_y3": 163.50995, "coord_origin": "TOPLEFT" }, "text": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "orig": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 182.53864, "r_x1": 280.64047, "r_y1": 182.53864, "r_x2": 280.64047, "r_y2": 174.46893, "r_x3": 151.51801, "r_y3": 174.46893, "coord_origin": "TOPLEFT" }, "text": "ble recognition to html (2021).", "orig": "ble recognition to html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.078, "r_y0": 182.58349999999996, "r_x1": 478.03403000000003, "r_y1": 182.58349999999996, "r_x2": 478.03403000000003, "r_y2": 175.11450000000002, "r_x3": 285.078, "r_y3": 175.11450000000002, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0319799999999, "r_y0": 182.53864, "r_x1": 480.59099999999995, "r_y1": 182.53864, "r_x2": 480.59099999999995, "r_y2": 174.46893, "r_x3": 478.0319799999999, "r_y3": 174.46893, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 193.54247999999995, "r_x1": 302.11584, "r_y1": 193.54247999999995, "r_x2": 302.11584, "r_y2": 186.07349, "r_x3": 151.51797, "r_y3": 186.07349, "coord_origin": "TOPLEFT" }, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76497, "r_y0": 204.45659999999998, "r_x1": 145.65964, "r_y1": 204.45659999999998, "r_x2": 145.65964, "r_y2": 196.38689999999997, "r_x3": 134.76497, "r_y3": 196.38689999999997, "coord_origin": "TOPLEFT" }, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.92294, "r_y0": 204.45659999999998, "r_x1": 480.5935400000001, "r_y1": 204.45659999999998, "r_x2": 480.5935400000001, "r_y2": 196.38689999999997, "r_x3": 149.92294, "r_y3": 196.38689999999997, "coord_origin": "TOPLEFT" }, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 215.41461000000004, "r_x1": 318.55124, "r_y1": 215.41461000000004, "r_x2": 318.55124, "r_y2": 207.34491000000003, "r_x3": 151.51797, "r_y3": 207.34491000000003, "coord_origin": "TOPLEFT" }, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.62097, "r_y0": 215.20844, "r_x1": 337.53186, "r_y1": 215.20844, "r_x2": 337.53186, "r_y2": 207.2821, "r_x3": 321.62097, "r_y3": 207.2821, "coord_origin": "TOPLEFT" }, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.53296, "r_y0": 215.41461000000004, "r_x1": 399.46927, "r_y1": 215.41461000000004, "r_x2": 399.46927, "r_y2": 207.34491000000003, "r_x3": 337.53296, "r_y3": 207.34491000000003, "coord_origin": "TOPLEFT" }, "text": ", 108565 (2022)", "orig": ", 108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76495, "r_y0": 226.3736, "r_x1": 145.7213, "r_y1": 226.3736, "r_x2": 145.7213, "r_y2": 218.30389000000002, "r_x3": 134.76495, "r_y3": 218.30389000000002, "coord_origin": "TOPLEFT" }, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.00871, "r_y0": 226.3736, "r_x1": 480.59012, "r_y1": 226.3736, "r_x2": 480.59012, "r_y2": 218.30389000000002, "r_x3": 150.00871, "r_y3": 218.30389000000002, "coord_origin": "TOPLEFT" }, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 237.33258, "r_x1": 480.59102999999993, "r_y1": 237.33258, "r_x2": 480.59102999999993, "r_y2": 229.26288, "r_x3": 151.51796, "r_y3": 229.26288, "coord_origin": "TOPLEFT" }, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 248.29156, "r_x1": 480.59119, "r_y1": 248.29156, "r_x2": 480.59119, "r_y2": 240.22186, "r_x3": 151.51796, "r_y3": 240.22186, "coord_origin": "TOPLEFT" }, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 259.25055, "r_x1": 293.44086, "r_y1": 259.25055, "r_x2": 293.44086, "r_y2": 251.18084999999996, "r_x3": 151.51796, "r_y3": 251.18084999999996, "coord_origin": "TOPLEFT" }, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 297.04996, "r_y0": 259.29540999999995, "r_x1": 480.59305000000006, "r_y1": 259.29540999999995, "r_x2": 480.59305000000006, "r_y2": 251.82641999999998, "r_x3": 297.04996, "r_y3": 251.82641999999998, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 270.25438999999994, "r_x1": 175.05028, "r_y1": 270.25438999999994, "r_x2": 175.05028, "r_y2": 262.7854, "r_x3": 151.51796, "r_y3": 262.7854, "coord_origin": "TOPLEFT" }, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76495, "r_y0": 281.16855000000004, "r_x1": 146.36798, "r_y1": 281.16855000000004, "r_x2": 146.36798, "r_y2": 273.09882000000005, "r_x3": 134.76495, "r_y3": 273.09882000000005, "coord_origin": "TOPLEFT" }, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90846, "r_y0": 281.16855000000004, "r_x1": 480.59094, "r_y1": 281.16855000000004, "r_x2": 480.59094, "r_y2": 273.09882000000005, "r_x3": 150.90846, "r_y3": 273.09882000000005, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "orig": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 292.12753, "r_x1": 480.58832000000007, "r_y1": 292.12753, "r_x2": 480.58832000000007, "r_y2": 284.05777, "r_x3": 151.51796, "r_y3": 284.05777, "coord_origin": "TOPLEFT" }, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 303.08651999999995, "r_x1": 480.59558, "r_y1": 303.08651999999995, "r_x2": 480.59558, "r_y2": 295.01675, "r_x3": 151.51796, "r_y3": 295.01675, "coord_origin": "TOPLEFT" }, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 314.0455, "r_x1": 236.02359, "r_y1": 314.0455, "r_x2": 236.02359, "r_y2": 305.97574, "r_x3": 151.51796, "r_y3": 305.97574, "coord_origin": "TOPLEFT" }, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76495, "r_y0": 325.00449000000003, "r_x1": 145.69547, "r_y1": 325.00449000000003, "r_x2": 145.69547, "r_y2": 316.93472, "r_x3": 134.76495, "r_y3": 316.93472, "coord_origin": "TOPLEFT" }, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.97276, "r_y0": 325.00449000000003, "r_x1": 480.59454, "r_y1": 325.00449000000003, "r_x2": 480.59454, "r_y2": 316.93472, "r_x3": 149.97276, "r_y3": 316.93472, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 335.96249, "r_x1": 480.59387000000004, "r_y1": 335.96249, "r_x2": 480.59387000000004, "r_y2": 327.8927299999999, "r_x3": 151.51796, "r_y3": 327.8927299999999, "coord_origin": "TOPLEFT" }, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 346.92148, "r_x1": 335.13635, "r_y1": 346.92148, "r_x2": 335.13635, "r_y2": 338.85172, "r_x3": 151.51796, "r_y3": 338.85172, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 7, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 143.97887, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.7012730240821838, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 143.97887, "r_y1": 101.84069999999997, "r_x2": 143.97887, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 167.82053, "t": 93.77099999999996, "r": 231.72049000000004, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.7889755964279175, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82053, "r_y0": 101.84069999999997, "r_x1": 178.08249, "r_y1": 101.84069999999997, "r_x2": 178.08249, "r_y2": 93.77099999999996, "r_x3": 167.82053, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37929, "r_y0": 101.84069999999997, "r_x1": 231.72049000000004, "r_y1": 101.84069999999997, "r_x2": 231.72049000000004, "r_y2": 93.77099999999996, "r_x3": 182.37929, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 134.765, "t": 119.67400999999995, "r": 480.59113, "b": 149.66168000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9444757699966431, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.74370999999985, "r_x1": 146.07936, "r_y1": 127.74370999999985, "r_x2": 146.07936, "r_y2": 119.67400999999995, "r_x3": 134.765, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5069, "r_y0": 127.74370999999985, "r_x1": 480.5892, "r_y1": 127.74370999999985, "r_x2": 480.5892, "r_y2": 119.67400999999995, "r_x3": 150.5069, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 138.70270000000005, "r_x1": 480.59113, "r_y1": 138.70270000000005, "r_x2": 480.59113, "r_y2": 130.63300000000004, "r_x3": 151.51801, "r_y3": 130.63300000000004, "coord_origin": "TOPLEFT" }, "text": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "orig": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 149.66168000000005, "r_x1": 427.53329, "r_y1": 149.66168000000005, "r_x2": 427.53329, "r_y2": 141.59198000000004, "r_x3": 151.51801, "r_y3": 141.59198000000004, "coord_origin": "TOPLEFT" }, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 134.765, "t": 152.55096000000003, "r": 480.59469999999993, "b": 193.54247999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9540892243385315, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 160.62067000000002, "r_x1": 146.19109, "r_y1": 160.62067000000002, "r_x2": 146.19109, "r_y2": 152.55096000000003, "r_x3": 134.765, "r_y3": 152.55096000000003, "coord_origin": "TOPLEFT" }, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.66234, "r_y0": 160.62067000000002, "r_x1": 480.5936899999999, "r_y1": 160.62067000000002, "r_x2": 480.5936899999999, "r_y2": 152.55096000000003, "r_x3": 150.66234, "r_y3": 152.55096000000003, "coord_origin": "TOPLEFT" }, "text": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "orig": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 171.57965000000002, "r_x1": 480.59469999999993, "r_y1": 171.57965000000002, "r_x2": 480.59469999999993, "r_y2": 163.50995, "r_x3": 151.51801, "r_y3": 163.50995, "coord_origin": "TOPLEFT" }, "text": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "orig": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 182.53864, "r_x1": 280.64047, "r_y1": 182.53864, "r_x2": 280.64047, "r_y2": 174.46893, "r_x3": 151.51801, "r_y3": 174.46893, "coord_origin": "TOPLEFT" }, "text": "ble recognition to html (2021).", "orig": "ble recognition to html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.078, "r_y0": 182.58349999999996, "r_x1": 478.03403000000003, "r_y1": 182.58349999999996, "r_x2": 478.03403000000003, "r_y2": 175.11450000000002, "r_x3": 285.078, "r_y3": 175.11450000000002, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0319799999999, "r_y0": 182.53864, "r_x1": 480.59099999999995, "r_y1": 182.53864, "r_x2": 480.59099999999995, "r_y2": 174.46893, "r_x3": 478.0319799999999, "r_y3": 174.46893, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 193.54247999999995, "r_x1": 302.11584, "r_y1": 193.54247999999995, "r_x2": 302.11584, "r_y2": 186.07349, "r_x3": 151.51797, "r_y3": 186.07349, "coord_origin": "TOPLEFT" }, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 134.76497, "t": 196.38689999999997, "r": 480.5935400000001, "b": 215.41461000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9531471729278564, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76497, "r_y0": 204.45659999999998, "r_x1": 145.65964, "r_y1": 204.45659999999998, "r_x2": 145.65964, "r_y2": 196.38689999999997, "r_x3": 134.76497, "r_y3": 196.38689999999997, "coord_origin": "TOPLEFT" }, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.92294, "r_y0": 204.45659999999998, "r_x1": 480.5935400000001, "r_y1": 204.45659999999998, "r_x2": 480.5935400000001, "r_y2": 196.38689999999997, "r_x3": 149.92294, "r_y3": 196.38689999999997, "coord_origin": "TOPLEFT" }, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 215.41461000000004, "r_x1": 318.55124, "r_y1": 215.41461000000004, "r_x2": 318.55124, "r_y2": 207.34491000000003, "r_x3": 151.51797, "r_y3": 207.34491000000003, "coord_origin": "TOPLEFT" }, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.62097, "r_y0": 215.20844, "r_x1": 337.53186, "r_y1": 215.20844, "r_x2": 337.53186, "r_y2": 207.2821, "r_x3": 321.62097, "r_y3": 207.2821, "coord_origin": "TOPLEFT" }, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.53296, "r_y0": 215.41461000000004, "r_x1": 399.46927, "r_y1": 215.41461000000004, "r_x2": 399.46927, "r_y2": 207.34491000000003, "r_x3": 337.53296, "r_y3": 207.34491000000003, "coord_origin": "TOPLEFT" }, "text": ", 108565 (2022)", "orig": ", 108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "list_item", "bbox": { "l": 134.76495, "t": 218.30389000000002, "r": 480.59305000000006, "b": 270.25438999999994, "coord_origin": "TOPLEFT" }, "confidence": 0.972027063369751, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76495, "r_y0": 226.3736, "r_x1": 145.7213, "r_y1": 226.3736, "r_x2": 145.7213, "r_y2": 218.30389000000002, "r_x3": 134.76495, "r_y3": 218.30389000000002, "coord_origin": "TOPLEFT" }, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.00871, "r_y0": 226.3736, "r_x1": 480.59012, "r_y1": 226.3736, "r_x2": 480.59012, "r_y2": 218.30389000000002, "r_x3": 150.00871, "r_y3": 218.30389000000002, "coord_origin": "TOPLEFT" }, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 237.33258, "r_x1": 480.59102999999993, "r_y1": 237.33258, "r_x2": 480.59102999999993, "r_y2": 229.26288, "r_x3": 151.51796, "r_y3": 229.26288, "coord_origin": "TOPLEFT" }, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 248.29156, "r_x1": 480.59119, "r_y1": 248.29156, "r_x2": 480.59119, "r_y2": 240.22186, "r_x3": 151.51796, "r_y3": 240.22186, "coord_origin": "TOPLEFT" }, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 259.25055, "r_x1": 293.44086, "r_y1": 259.25055, "r_x2": 293.44086, "r_y2": 251.18084999999996, "r_x3": 151.51796, "r_y3": 251.18084999999996, "coord_origin": "TOPLEFT" }, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 297.04996, "r_y0": 259.29540999999995, "r_x1": 480.59305000000006, "r_y1": 259.29540999999995, "r_x2": 480.59305000000006, "r_y2": 251.82641999999998, "r_x3": 297.04996, "r_y3": 251.82641999999998, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 270.25438999999994, "r_x1": 175.05028, "r_y1": 270.25438999999994, "r_x2": 175.05028, "r_y2": 262.7854, "r_x3": 151.51796, "r_y3": 262.7854, "coord_origin": "TOPLEFT" }, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "list_item", "bbox": { "l": 134.76495, "t": 273.09882000000005, "r": 480.59558, "b": 314.0455, "coord_origin": "TOPLEFT" }, "confidence": 0.9685125946998596, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76495, "r_y0": 281.16855000000004, "r_x1": 146.36798, "r_y1": 281.16855000000004, "r_x2": 146.36798, "r_y2": 273.09882000000005, "r_x3": 134.76495, "r_y3": 273.09882000000005, "coord_origin": "TOPLEFT" }, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90846, "r_y0": 281.16855000000004, "r_x1": 480.59094, "r_y1": 281.16855000000004, "r_x2": 480.59094, "r_y2": 273.09882000000005, "r_x3": 150.90846, "r_y3": 273.09882000000005, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "orig": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 292.12753, "r_x1": 480.58832000000007, "r_y1": 292.12753, "r_x2": 480.58832000000007, "r_y2": 284.05777, "r_x3": 151.51796, "r_y3": 284.05777, "coord_origin": "TOPLEFT" }, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 303.08651999999995, "r_x1": 480.59558, "r_y1": 303.08651999999995, "r_x2": 480.59558, "r_y2": 295.01675, "r_x3": 151.51796, "r_y3": 295.01675, "coord_origin": "TOPLEFT" }, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 314.0455, "r_x1": 236.02359, "r_y1": 314.0455, "r_x2": 236.02359, "r_y2": 305.97574, "r_x3": 151.51796, "r_y3": 305.97574, "coord_origin": "TOPLEFT" }, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "list_item", "bbox": { "l": 134.76495, "t": 316.93472, "r": 480.59454, "b": 346.92148, "coord_origin": "TOPLEFT" }, "confidence": 0.9668973684310913, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76495, "r_y0": 325.00449000000003, "r_x1": 145.69547, "r_y1": 325.00449000000003, "r_x2": 145.69547, "r_y2": 316.93472, "r_x3": 134.76495, "r_y3": 316.93472, "coord_origin": "TOPLEFT" }, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.97276, "r_y0": 325.00449000000003, "r_x1": 480.59454, "r_y1": 325.00449000000003, "r_x2": 480.59454, "r_y2": 316.93472, "r_x3": 149.97276, "r_y3": 316.93472, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 335.96249, "r_x1": 480.59387000000004, "r_y1": 335.96249, "r_x2": 480.59387000000004, "r_y2": 327.8927299999999, "r_x3": 151.51796, "r_y3": 327.8927299999999, "coord_origin": "TOPLEFT" }, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 346.92148, "r_x1": 335.13635, "r_y1": 346.92148, "r_x2": 335.13635, "r_y2": 338.85172, "r_x3": 151.51796, "r_y3": 338.85172, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 7, "page_no": 13, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 143.97887, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.7012730240821838, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 143.97887, "r_y1": 101.84069999999997, "r_x2": 143.97887, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14" }, { "label": "page_header", "id": 6, "page_no": 13, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 167.82053, "t": 93.77099999999996, "r": 231.72049000000004, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.7889755964279175, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82053, "r_y0": 101.84069999999997, "r_x1": 178.08249, "r_y1": 101.84069999999997, "r_x2": 178.08249, "r_y2": 93.77099999999996, "r_x3": 167.82053, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37929, "r_y0": 101.84069999999997, "r_x1": 231.72049000000004, "r_y1": 101.84069999999997, "r_x2": 231.72049000000004, "r_y2": 93.77099999999996, "r_x3": 182.37929, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "list_item", "id": 5, "page_no": 13, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 134.765, "t": 119.67400999999995, "r": 480.59113, "b": 149.66168000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9444757699966431, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.74370999999985, "r_x1": 146.07936, "r_y1": 127.74370999999985, "r_x2": 146.07936, "r_y2": 119.67400999999995, "r_x3": 134.765, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5069, "r_y0": 127.74370999999985, "r_x1": 480.5892, "r_y1": 127.74370999999985, "r_x2": 480.5892, "r_y2": 119.67400999999995, "r_x3": 150.5069, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 138.70270000000005, "r_x1": 480.59113, "r_y1": 138.70270000000005, "r_x2": 480.59113, "r_y2": 130.63300000000004, "r_x3": 151.51801, "r_y3": 130.63300000000004, "coord_origin": "TOPLEFT" }, "text": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "orig": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 149.66168000000005, "r_x1": 427.53329, "r_y1": 149.66168000000005, "r_x2": 427.53329, "r_y2": 141.59198000000004, "r_x3": 151.51801, "r_y3": 141.59198000000004, "coord_origin": "TOPLEFT" }, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "18. Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruction network for table structure recognition. In: Proceedings of the IEEE/CVF International Conference on Computer Vision. pp. 1295-1304 (2021)" }, { "label": "list_item", "id": 3, "page_no": 13, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 134.765, "t": 152.55096000000003, "r": 480.59469999999993, "b": 193.54247999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9540892243385315, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 160.62067000000002, "r_x1": 146.19109, "r_y1": 160.62067000000002, "r_x2": 146.19109, "r_y2": 152.55096000000003, "r_x3": 134.765, "r_y3": 152.55096000000003, "coord_origin": "TOPLEFT" }, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.66234, "r_y0": 160.62067000000002, "r_x1": 480.5936899999999, "r_y1": 160.62067000000002, "r_x2": 480.5936899999999, "r_y2": 152.55096000000003, "r_x3": 150.66234, "r_y3": 152.55096000000003, "coord_origin": "TOPLEFT" }, "text": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "orig": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 171.57965000000002, "r_x1": 480.59469999999993, "r_y1": 171.57965000000002, "r_x2": 480.59469999999993, "r_y2": 163.50995, "r_x3": 151.51801, "r_y3": 163.50995, "coord_origin": "TOPLEFT" }, "text": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "orig": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 182.53864, "r_x1": 280.64047, "r_y1": 182.53864, "r_x2": 280.64047, "r_y2": 174.46893, "r_x3": 151.51801, "r_y3": 174.46893, "coord_origin": "TOPLEFT" }, "text": "ble recognition to html (2021).", "orig": "ble recognition to html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.078, "r_y0": 182.58349999999996, "r_x1": 478.03403000000003, "r_y1": 182.58349999999996, "r_x2": 478.03403000000003, "r_y2": 175.11450000000002, "r_x3": 285.078, "r_y3": 175.11450000000002, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0319799999999, "r_y0": 182.53864, "r_x1": 480.59099999999995, "r_y1": 182.53864, "r_x2": 480.59099999999995, "r_y2": 174.46893, "r_x3": 478.0319799999999, "r_y3": 174.46893, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 193.54247999999995, "r_x1": 302.11584, "r_y1": 193.54247999999995, "r_x2": 302.11584, "r_y2": 186.07349, "r_x3": 151.51797, "r_y3": 186.07349, "coord_origin": "TOPLEFT" }, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "19. Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup's solution for icdar 2021 competition on scientific literature parsing task b: Table recognition to html (2021). https://doi.org/10.48550/ARXIV.2105.01848 , https://arxiv.org/abs/2105.01848" }, { "label": "list_item", "id": 4, "page_no": 13, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 134.76497, "t": 196.38689999999997, "r": 480.5935400000001, "b": 215.41461000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9531471729278564, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76497, "r_y0": 204.45659999999998, "r_x1": 145.65964, "r_y1": 204.45659999999998, "r_x2": 145.65964, "r_y2": 196.38689999999997, "r_x3": 134.76497, "r_y3": 196.38689999999997, "coord_origin": "TOPLEFT" }, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.92294, "r_y0": 204.45659999999998, "r_x1": 480.5935400000001, "r_y1": 204.45659999999998, "r_x2": 480.5935400000001, "r_y2": 196.38689999999997, "r_x3": 149.92294, "r_y3": 196.38689999999997, "coord_origin": "TOPLEFT" }, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 215.41461000000004, "r_x1": 318.55124, "r_y1": 215.41461000000004, "r_x2": 318.55124, "r_y2": 207.34491000000003, "r_x3": 151.51797, "r_y3": 207.34491000000003, "coord_origin": "TOPLEFT" }, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.62097, "r_y0": 215.20844, "r_x1": 337.53186, "r_y1": 215.20844, "r_x2": 337.53186, "r_y2": 207.2821, "r_x3": 321.62097, "r_y3": 207.2821, "coord_origin": "TOPLEFT" }, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.53296, "r_y0": 215.41461000000004, "r_x1": 399.46927, "r_y1": 215.41461000000004, "r_x2": 399.46927, "r_y2": 207.34491000000003, "r_x3": 337.53296, "r_y3": 207.34491000000003, "coord_origin": "TOPLEFT" }, "text": ", 108565 (2022)", "orig": ", 108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "20. Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table structure recognizer. Pattern Recognition 126 , 108565 (2022)" }, { "label": "list_item", "id": 0, "page_no": 13, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 134.76495, "t": 218.30389000000002, "r": 480.59305000000006, "b": 270.25438999999994, "coord_origin": "TOPLEFT" }, "confidence": 0.972027063369751, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76495, "r_y0": 226.3736, "r_x1": 145.7213, "r_y1": 226.3736, "r_x2": 145.7213, "r_y2": 218.30389000000002, "r_x3": 134.76495, "r_y3": 218.30389000000002, "coord_origin": "TOPLEFT" }, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.00871, "r_y0": 226.3736, "r_x1": 480.59012, "r_y1": 226.3736, "r_x2": 480.59012, "r_y2": 218.30389000000002, "r_x3": 150.00871, "r_y3": 218.30389000000002, "coord_origin": "TOPLEFT" }, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 237.33258, "r_x1": 480.59102999999993, "r_y1": 237.33258, "r_x2": 480.59102999999993, "r_y2": 229.26288, "r_x3": 151.51796, "r_y3": 229.26288, "coord_origin": "TOPLEFT" }, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 248.29156, "r_x1": 480.59119, "r_y1": 248.29156, "r_x2": 480.59119, "r_y2": 240.22186, "r_x3": 151.51796, "r_y3": 240.22186, "coord_origin": "TOPLEFT" }, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 259.25055, "r_x1": 293.44086, "r_y1": 259.25055, "r_x2": 293.44086, "r_y2": 251.18084999999996, "r_x3": 151.51796, "r_y3": 251.18084999999996, "coord_origin": "TOPLEFT" }, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 297.04996, "r_y0": 259.29540999999995, "r_x1": 480.59305000000006, "r_y1": 259.29540999999995, "r_x2": 480.59305000000006, "r_y2": 251.82641999999998, "r_x3": 297.04996, "r_y3": 251.82641999999998, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 270.25438999999994, "r_x1": 175.05028, "r_y1": 270.25438999999994, "r_x2": 175.05028, "r_y2": 262.7854, "r_x3": 151.51796, "r_y3": 262.7854, "coord_origin": "TOPLEFT" }, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "21. Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vision (WACV). pp. 697-706 (2021). https://doi.org/10.1109/WACV48630.2021. 00074" }, { "label": "list_item", "id": 1, "page_no": 13, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 134.76495, "t": 273.09882000000005, "r": 480.59558, "b": 314.0455, "coord_origin": "TOPLEFT" }, "confidence": 0.9685125946998596, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76495, "r_y0": 281.16855000000004, "r_x1": 146.36798, "r_y1": 281.16855000000004, "r_x2": 146.36798, "r_y2": 273.09882000000005, "r_x3": 134.76495, "r_y3": 273.09882000000005, "coord_origin": "TOPLEFT" }, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90846, "r_y0": 281.16855000000004, "r_x1": 480.59094, "r_y1": 281.16855000000004, "r_x2": 480.59094, "r_y2": 273.09882000000005, "r_x3": 150.90846, "r_y3": 273.09882000000005, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "orig": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 292.12753, "r_x1": 480.58832000000007, "r_y1": 292.12753, "r_x2": 480.58832000000007, "r_y2": 284.05777, "r_x3": 151.51796, "r_y3": 284.05777, "coord_origin": "TOPLEFT" }, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 303.08651999999995, "r_x1": 480.59558, "r_y1": 303.08651999999995, "r_x2": 480.59558, "r_y2": 295.01675, "r_x3": 151.51796, "r_y3": 295.01675, "coord_origin": "TOPLEFT" }, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 314.0455, "r_x1": 236.02359, "r_y1": 314.0455, "r_x2": 236.02359, "r_y2": 305.97574, "r_x3": 151.51796, "r_y3": 305.97574, "coord_origin": "TOPLEFT" }, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "22. Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition: Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M. (eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Publishing, Cham (2020)" }, { "label": "list_item", "id": 2, "page_no": 13, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 134.76495, "t": 316.93472, "r": 480.59454, "b": 346.92148, "coord_origin": "TOPLEFT" }, "confidence": 0.9668973684310913, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76495, "r_y0": 325.00449000000003, "r_x1": 145.69547, "r_y1": 325.00449000000003, "r_x2": 145.69547, "r_y2": 316.93472, "r_x3": 134.76495, "r_y3": 316.93472, "coord_origin": "TOPLEFT" }, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.97276, "r_y0": 325.00449000000003, "r_x1": 480.59454, "r_y1": 325.00449000000003, "r_x2": 480.59454, "r_y2": 316.93472, "r_x3": 149.97276, "r_y3": 316.93472, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 335.96249, "r_x1": 480.59387000000004, "r_y1": 335.96249, "r_x2": 480.59387000000004, "r_y2": 327.8927299999999, "r_x3": 151.51796, "r_y3": 327.8927299999999, "coord_origin": "TOPLEFT" }, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 346.92148, "r_x1": 335.13635, "r_y1": 346.92148, "r_x2": 335.13635, "r_y2": 338.85172, "r_x3": 151.51796, "r_y3": 338.85172, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "23. Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document layout analysis. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1015-1022. IEEE (2019)" } ], "body": [ { "label": "list_item", "id": 5, "page_no": 13, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 134.765, "t": 119.67400999999995, "r": 480.59113, "b": 149.66168000000005, "coord_origin": "TOPLEFT" }, "confidence": 0.9444757699966431, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 127.74370999999985, "r_x1": 146.07936, "r_y1": 127.74370999999985, "r_x2": 146.07936, "r_y2": 119.67400999999995, "r_x3": 134.765, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5069, "r_y0": 127.74370999999985, "r_x1": 480.5892, "r_y1": 127.74370999999985, "r_x2": 480.5892, "r_y2": 119.67400999999995, "r_x3": 150.5069, "r_y3": 119.67400999999995, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 138.70270000000005, "r_x1": 480.59113, "r_y1": 138.70270000000005, "r_x2": 480.59113, "r_y2": 130.63300000000004, "r_x3": 151.51801, "r_y3": 130.63300000000004, "coord_origin": "TOPLEFT" }, "text": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "orig": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 149.66168000000005, "r_x1": 427.53329, "r_y1": 149.66168000000005, "r_x2": 427.53329, "r_y2": 141.59198000000004, "r_x3": 151.51801, "r_y3": 141.59198000000004, "coord_origin": "TOPLEFT" }, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "18. Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruction network for table structure recognition. In: Proceedings of the IEEE/CVF International Conference on Computer Vision. pp. 1295-1304 (2021)" }, { "label": "list_item", "id": 3, "page_no": 13, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 134.765, "t": 152.55096000000003, "r": 480.59469999999993, "b": 193.54247999999995, "coord_origin": "TOPLEFT" }, "confidence": 0.9540892243385315, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 160.62067000000002, "r_x1": 146.19109, "r_y1": 160.62067000000002, "r_x2": 146.19109, "r_y2": 152.55096000000003, "r_x3": 134.765, "r_y3": 152.55096000000003, "coord_origin": "TOPLEFT" }, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.66234, "r_y0": 160.62067000000002, "r_x1": 480.5936899999999, "r_y1": 160.62067000000002, "r_x2": 480.5936899999999, "r_y2": 152.55096000000003, "r_x3": 150.66234, "r_y3": 152.55096000000003, "coord_origin": "TOPLEFT" }, "text": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "orig": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 171.57965000000002, "r_x1": 480.59469999999993, "r_y1": 171.57965000000002, "r_x2": 480.59469999999993, "r_y2": 163.50995, "r_x3": 151.51801, "r_y3": 163.50995, "coord_origin": "TOPLEFT" }, "text": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "orig": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51801, "r_y0": 182.53864, "r_x1": 280.64047, "r_y1": 182.53864, "r_x2": 280.64047, "r_y2": 174.46893, "r_x3": 151.51801, "r_y3": 174.46893, "coord_origin": "TOPLEFT" }, "text": "ble recognition to html (2021).", "orig": "ble recognition to html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.078, "r_y0": 182.58349999999996, "r_x1": 478.03403000000003, "r_y1": 182.58349999999996, "r_x2": 478.03403000000003, "r_y2": 175.11450000000002, "r_x3": 285.078, "r_y3": 175.11450000000002, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0319799999999, "r_y0": 182.53864, "r_x1": 480.59099999999995, "r_y1": 182.53864, "r_x2": 480.59099999999995, "r_y2": 174.46893, "r_x3": 478.0319799999999, "r_y3": 174.46893, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 193.54247999999995, "r_x1": 302.11584, "r_y1": 193.54247999999995, "r_x2": 302.11584, "r_y2": 186.07349, "r_x3": 151.51797, "r_y3": 186.07349, "coord_origin": "TOPLEFT" }, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "19. Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup's solution for icdar 2021 competition on scientific literature parsing task b: Table recognition to html (2021). https://doi.org/10.48550/ARXIV.2105.01848 , https://arxiv.org/abs/2105.01848" }, { "label": "list_item", "id": 4, "page_no": 13, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 134.76497, "t": 196.38689999999997, "r": 480.5935400000001, "b": 215.41461000000004, "coord_origin": "TOPLEFT" }, "confidence": 0.9531471729278564, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76497, "r_y0": 204.45659999999998, "r_x1": 145.65964, "r_y1": 204.45659999999998, "r_x2": 145.65964, "r_y2": 196.38689999999997, "r_x3": 134.76497, "r_y3": 196.38689999999997, "coord_origin": "TOPLEFT" }, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.92294, "r_y0": 204.45659999999998, "r_x1": 480.5935400000001, "r_y1": 204.45659999999998, "r_x2": 480.5935400000001, "r_y2": 196.38689999999997, "r_x3": 149.92294, "r_y3": 196.38689999999997, "coord_origin": "TOPLEFT" }, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51797, "r_y0": 215.41461000000004, "r_x1": 318.55124, "r_y1": 215.41461000000004, "r_x2": 318.55124, "r_y2": 207.34491000000003, "r_x3": 151.51797, "r_y3": 207.34491000000003, "coord_origin": "TOPLEFT" }, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.62097, "r_y0": 215.20844, "r_x1": 337.53186, "r_y1": 215.20844, "r_x2": 337.53186, "r_y2": 207.2821, "r_x3": 321.62097, "r_y3": 207.2821, "coord_origin": "TOPLEFT" }, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.53296, "r_y0": 215.41461000000004, "r_x1": 399.46927, "r_y1": 215.41461000000004, "r_x2": 399.46927, "r_y2": 207.34491000000003, "r_x3": 337.53296, "r_y3": 207.34491000000003, "coord_origin": "TOPLEFT" }, "text": ", 108565 (2022)", "orig": ", 108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "20. Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table structure recognizer. Pattern Recognition 126 , 108565 (2022)" }, { "label": "list_item", "id": 0, "page_no": 13, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 134.76495, "t": 218.30389000000002, "r": 480.59305000000006, "b": 270.25438999999994, "coord_origin": "TOPLEFT" }, "confidence": 0.972027063369751, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76495, "r_y0": 226.3736, "r_x1": 145.7213, "r_y1": 226.3736, "r_x2": 145.7213, "r_y2": 218.30389000000002, "r_x3": 134.76495, "r_y3": 218.30389000000002, "coord_origin": "TOPLEFT" }, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.00871, "r_y0": 226.3736, "r_x1": 480.59012, "r_y1": 226.3736, "r_x2": 480.59012, "r_y2": 218.30389000000002, "r_x3": 150.00871, "r_y3": 218.30389000000002, "coord_origin": "TOPLEFT" }, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 237.33258, "r_x1": 480.59102999999993, "r_y1": 237.33258, "r_x2": 480.59102999999993, "r_y2": 229.26288, "r_x3": 151.51796, "r_y3": 229.26288, "coord_origin": "TOPLEFT" }, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 248.29156, "r_x1": 480.59119, "r_y1": 248.29156, "r_x2": 480.59119, "r_y2": 240.22186, "r_x3": 151.51796, "r_y3": 240.22186, "coord_origin": "TOPLEFT" }, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 259.25055, "r_x1": 293.44086, "r_y1": 259.25055, "r_x2": 293.44086, "r_y2": 251.18084999999996, "r_x3": 151.51796, "r_y3": 251.18084999999996, "coord_origin": "TOPLEFT" }, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 297.04996, "r_y0": 259.29540999999995, "r_x1": 480.59305000000006, "r_y1": 259.29540999999995, "r_x2": 480.59305000000006, "r_y2": 251.82641999999998, "r_x3": 297.04996, "r_y3": 251.82641999999998, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 270.25438999999994, "r_x1": 175.05028, "r_y1": 270.25438999999994, "r_x2": 175.05028, "r_y2": 262.7854, "r_x3": 151.51796, "r_y3": 262.7854, "coord_origin": "TOPLEFT" }, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "21. Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vision (WACV). pp. 697-706 (2021). https://doi.org/10.1109/WACV48630.2021. 00074" }, { "label": "list_item", "id": 1, "page_no": 13, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 134.76495, "t": 273.09882000000005, "r": 480.59558, "b": 314.0455, "coord_origin": "TOPLEFT" }, "confidence": 0.9685125946998596, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76495, "r_y0": 281.16855000000004, "r_x1": 146.36798, "r_y1": 281.16855000000004, "r_x2": 146.36798, "r_y2": 273.09882000000005, "r_x3": 134.76495, "r_y3": 273.09882000000005, "coord_origin": "TOPLEFT" }, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.90846, "r_y0": 281.16855000000004, "r_x1": 480.59094, "r_y1": 281.16855000000004, "r_x2": 480.59094, "r_y2": 273.09882000000005, "r_x3": 150.90846, "r_y3": 273.09882000000005, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "orig": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 292.12753, "r_x1": 480.58832000000007, "r_y1": 292.12753, "r_x2": 480.58832000000007, "r_y2": 284.05777, "r_x3": 151.51796, "r_y3": 284.05777, "coord_origin": "TOPLEFT" }, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 303.08651999999995, "r_x1": 480.59558, "r_y1": 303.08651999999995, "r_x2": 480.59558, "r_y2": 295.01675, "r_x3": 151.51796, "r_y3": 295.01675, "coord_origin": "TOPLEFT" }, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 314.0455, "r_x1": 236.02359, "r_y1": 314.0455, "r_x2": 236.02359, "r_y2": 305.97574, "r_x3": 151.51796, "r_y3": 305.97574, "coord_origin": "TOPLEFT" }, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "22. Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition: Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M. (eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Publishing, Cham (2020)" }, { "label": "list_item", "id": 2, "page_no": 13, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 134.76495, "t": 316.93472, "r": 480.59454, "b": 346.92148, "coord_origin": "TOPLEFT" }, "confidence": 0.9668973684310913, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76495, "r_y0": 325.00449000000003, "r_x1": 145.69547, "r_y1": 325.00449000000003, "r_x2": 145.69547, "r_y2": 316.93472, "r_x3": 134.76495, "r_y3": 316.93472, "coord_origin": "TOPLEFT" }, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.97276, "r_y0": 325.00449000000003, "r_x1": 480.59454, "r_y1": 325.00449000000003, "r_x2": 480.59454, "r_y2": 316.93472, "r_x3": 149.97276, "r_y3": 316.93472, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 335.96249, "r_x1": 480.59387000000004, "r_y1": 335.96249, "r_x2": 480.59387000000004, "r_y2": 327.8927299999999, "r_x3": 151.51796, "r_y3": 327.8927299999999, "coord_origin": "TOPLEFT" }, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.51796, "r_y0": 346.92148, "r_x1": 335.13635, "r_y1": 346.92148, "r_x2": 335.13635, "r_y2": 338.85172, "r_x3": 151.51796, "r_y3": 338.85172, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "23. Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document layout analysis. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1015-1022. IEEE (2019)" } ], "headers": [ { "label": "page_header", "id": 7, "page_no": 13, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 134.765, "t": 93.77099999999996, "r": 143.97887, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.7012730240821838, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.765, "r_y0": 101.84069999999997, "r_x1": 143.97887, "r_y1": 101.84069999999997, "r_x2": 143.97887, "r_y2": 93.77099999999996, "r_x3": 134.765, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14" }, { "label": "page_header", "id": 6, "page_no": 13, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 167.82053, "t": 93.77099999999996, "r": 231.72049000000004, "b": 101.84069999999997, "coord_origin": "TOPLEFT" }, "confidence": 0.7889755964279175, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82053, "r_y0": 101.84069999999997, "r_x1": 178.08249, "r_y1": 101.84069999999997, "r_x2": 178.08249, "r_y2": 93.77099999999996, "r_x3": 167.82053, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37929, "r_y0": 101.84069999999997, "r_x1": 231.72049000000004, "r_y1": 101.84069999999997, "r_x2": 231.72049000000004, "r_y2": 93.77099999999996, "r_x3": 182.37929, "r_y3": 93.77099999999996, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } } ]