fix(pypdfium): resolve overlapping text when merging bounding boxes (#1549)
Get merged_text from the merged bounding box instead of concatenating the cell texts, to prevent overlapping text.

Signed-off-by: Pedro Ribeiro <pedro_ribeiro_93@hotmail.com>
This commit is contained in:
parent
12a0e64892
commit
98b5eeb844
@ -175,13 +175,18 @@ class PyPdfiumPageBackend(PdfPageBackend):
|
||||
if len(group) == 1:
|
||||
return group[0]
|
||||
|
||||
merged_text = "".join(cell.text for cell in group)
|
||||
merged_bbox = BoundingBox(
|
||||
l=min(cell.rect.to_bounding_box().l for cell in group),
|
||||
t=min(cell.rect.to_bounding_box().t for cell in group),
|
||||
r=max(cell.rect.to_bounding_box().r for cell in group),
|
||||
b=max(cell.rect.to_bounding_box().b for cell in group),
|
||||
)
|
||||
|
||||
assert self._ppage is not None
|
||||
self.text_page = self._ppage.get_textpage()
|
||||
bbox = merged_bbox.to_bottom_left_origin(page_size.height)
|
||||
merged_text = self.text_page.get_text_bounded(*bbox.as_tuple())
|
||||
|
||||
return TextCell(
|
||||
index=group[0].index,
|
||||
text=merged_text,
|
||||
|
@ -4913,9 +4913,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
315.65362548828125,
|
||||
489.1985778808594,
|
||||
489.19854736328125,
|
||||
537.1475219726562,
|
||||
563.276611328125
|
||||
563.2765655517578
|
||||
],
|
||||
"page": 1,
|
||||
"span": [
|
||||
@ -4979,9 +4979,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
312.10369873046875,
|
||||
541.3901519775391,
|
||||
541.3901214599609,
|
||||
550.38916015625,
|
||||
713.5591354370117
|
||||
713.5591125488281
|
||||
],
|
||||
"page": 3,
|
||||
"span": [
|
||||
@ -5003,7 +5003,7 @@
|
||||
74.30525970458984,
|
||||
608.2984924316406,
|
||||
519.9801025390625,
|
||||
714.0887985229492
|
||||
714.0887908935547
|
||||
],
|
||||
"page": 5,
|
||||
"span": [
|
||||
@ -5024,7 +5024,7 @@
|
||||
"bbox": [
|
||||
53.03328323364258,
|
||||
284.3311462402344,
|
||||
285.3731689453125,
|
||||
285.3731384277344,
|
||||
534.3346557617188
|
||||
],
|
||||
"page": 5,
|
||||
@ -5047,7 +5047,7 @@
|
||||
49.97503662109375,
|
||||
604.4210662841797,
|
||||
301.6335754394531,
|
||||
688.2873382568359
|
||||
688.2873153686523
|
||||
],
|
||||
"page": 8,
|
||||
"span": [
|
||||
@ -5066,7 +5066,7 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
305.5836486816406,
|
||||
305.58367919921875,
|
||||
611.3732452392578,
|
||||
554.8258666992188,
|
||||
693.3458404541016
|
||||
@ -5111,9 +5111,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
216.76925659179688,
|
||||
348.65301513671875,
|
||||
348.6529541015625,
|
||||
375.7829284667969,
|
||||
411.5093688964844
|
||||
411.5093994140625
|
||||
],
|
||||
"page": 8,
|
||||
"span": [
|
||||
@ -5132,10 +5132,10 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
383.1364440917969,
|
||||
383.1363830566406,
|
||||
349.2250671386719,
|
||||
542.1132202148438,
|
||||
410.7686767578125
|
||||
542.1131591796875,
|
||||
410.7687072753906
|
||||
],
|
||||
"page": 8,
|
||||
"span": [
|
||||
@ -5220,7 +5220,7 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
51.15378952026367,
|
||||
51.153778076171875,
|
||||
447.09332275390625,
|
||||
282.8598937988281,
|
||||
687.6914825439453
|
||||
@ -5286,8 +5286,8 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
55.116363525390625,
|
||||
542.6654510498047,
|
||||
55.11635208129883,
|
||||
542.6654968261719,
|
||||
279.370849609375,
|
||||
655.7449951171875
|
||||
],
|
||||
@ -5375,9 +5375,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
323.46868896484375,
|
||||
327.739501953125,
|
||||
327.73956298828125,
|
||||
525.9569091796875,
|
||||
429.5491638183594
|
||||
429.5492248535156
|
||||
],
|
||||
"page": 15,
|
||||
"span": [
|
||||
@ -5421,7 +5421,7 @@
|
||||
66.79948425292969,
|
||||
293.8616027832031,
|
||||
528.5565795898438,
|
||||
538.3836822509766
|
||||
538.3837127685547
|
||||
],
|
||||
"page": 16,
|
||||
"span": [
|
||||
@ -5443,9 +5443,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
315.65362548828125,
|
||||
489.1985778808594,
|
||||
489.19854736328125,
|
||||
537.1475219726562,
|
||||
563.276611328125
|
||||
563.2765655517578
|
||||
],
|
||||
"page": 1,
|
||||
"span": [
|
||||
@ -6250,10 +6250,10 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
310.67584228515625,
|
||||
310.6757507324219,
|
||||
636.7794799804688,
|
||||
542.9547119140625,
|
||||
718.8061141967773
|
||||
542.9546508789062,
|
||||
718.8061218261719
|
||||
],
|
||||
"page": 4,
|
||||
"span": [
|
||||
@ -9329,7 +9329,7 @@
|
||||
332.9688720703125,
|
||||
148.73028564453125,
|
||||
520.942138671875,
|
||||
251.7164306640625
|
||||
251.71649169921875
|
||||
],
|
||||
"page": 7,
|
||||
"span": [
|
||||
@ -10152,9 +10152,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
53.62853240966797,
|
||||
499.60003662109375,
|
||||
499.6000061035156,
|
||||
298.5574951171875,
|
||||
573.0514221191406
|
||||
573.0514526367188
|
||||
],
|
||||
"page": 8,
|
||||
"span": [
|
||||
@ -12941,7 +12941,7 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
83.31756591796875,
|
||||
83.31759643554688,
|
||||
304.7430114746094,
|
||||
248.873046875,
|
||||
395.9864501953125
|
||||
@ -12968,9 +12968,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
310.3294372558594,
|
||||
655.8524780273438,
|
||||
655.8524932861328,
|
||||
555.8338623046875,
|
||||
690.8223266601562
|
||||
690.8223342895508
|
||||
],
|
||||
"page": 13,
|
||||
"span": [
|
||||
@ -12994,9 +12994,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
309.9566345214844,
|
||||
607.2774658203125,
|
||||
607.2774353027344,
|
||||
555.7466430664062,
|
||||
637.3855133056641
|
||||
637.3854827880859
|
||||
],
|
||||
"page": 13,
|
||||
"span": [
|
||||
@ -13019,10 +13019,10 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
309.9635314941406,
|
||||
558.4485473632812,
|
||||
555.7054443359375,
|
||||
596.2945861816406
|
||||
309.96356201171875,
|
||||
558.4485168457031,
|
||||
555.7053833007812,
|
||||
596.2945098876953
|
||||
],
|
||||
"page": 13,
|
||||
"span": [
|
||||
@ -13175,10 +13175,10 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
51.72642135620117,
|
||||
447.7554931640625,
|
||||
283.114013671875,
|
||||
518.3907165527344
|
||||
51.726383209228516,
|
||||
447.7555236816406,
|
||||
283.1140441894531,
|
||||
518.3907470703125
|
||||
],
|
||||
"page": 14,
|
||||
"span": [
|
||||
@ -13201,7 +13201,7 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
51.434879302978516,
|
||||
51.43488693237305,
|
||||
300.17974853515625,
|
||||
310.7267150878906,
|
||||
338.51251220703125
|
||||
@ -13253,7 +13253,7 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
51.27280807495117,
|
||||
51.2728271484375,
|
||||
200.086669921875,
|
||||
311.0897216796875,
|
||||
238.271484375
|
||||
@ -13435,10 +13435,10 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
319.06494140625,
|
||||
319.0649719238281,
|
||||
122.80792236328125,
|
||||
533.77392578125,
|
||||
182.1591796875
|
||||
533.7738647460938,
|
||||
182.1590576171875
|
||||
],
|
||||
"page": 14,
|
||||
"span": [
|
||||
@ -13461,8 +13461,8 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
55.116363525390625,
|
||||
542.6654510498047,
|
||||
55.11635208129883,
|
||||
542.6654968261719,
|
||||
279.370849609375,
|
||||
655.7449951171875
|
||||
],
|
||||
@ -13513,10 +13513,10 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
323.0059509277344,
|
||||
569.0885925292969,
|
||||
525.95166015625,
|
||||
670.4528503417969
|
||||
323.0059814453125,
|
||||
569.0885772705078,
|
||||
525.9517211914062,
|
||||
670.4528656005859
|
||||
],
|
||||
"page": 15,
|
||||
"span": [
|
||||
@ -13540,9 +13540,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
323.384765625,
|
||||
447.90789794921875,
|
||||
447.9078674316406,
|
||||
526.1268920898438,
|
||||
550.0270538330078
|
||||
550.0270690917969
|
||||
],
|
||||
"page": 15,
|
||||
"span": [
|
||||
@ -13566,9 +13566,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
323.46868896484375,
|
||||
327.739501953125,
|
||||
327.73956298828125,
|
||||
525.9569091796875,
|
||||
429.5491638183594
|
||||
429.5492248535156
|
||||
],
|
||||
"page": 15,
|
||||
"span": [
|
||||
|
File diff suppressed because it is too large
Load Diff
@ -3099,9 +3099,9 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
323.408203125,
|
||||
266.1492919921875,
|
||||
553.2952270507812,
|
||||
323.4081115722656,
|
||||
266.14935302734375,
|
||||
553.295166015625,
|
||||
541.6512603759766
|
||||
],
|
||||
"page": 1,
|
||||
@ -3122,9 +3122,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
88.33030700683594,
|
||||
571.4317321777344,
|
||||
571.4317626953125,
|
||||
263.7049560546875,
|
||||
699.1134796142578
|
||||
699.1134490966797
|
||||
],
|
||||
"page": 3,
|
||||
"span": [
|
||||
@ -3144,9 +3144,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
53.05912780761719,
|
||||
251.135986328125,
|
||||
251.1358642578125,
|
||||
295.8506164550781,
|
||||
481.2087097167969
|
||||
481.20867919921875
|
||||
],
|
||||
"page": 4,
|
||||
"span": [
|
||||
@ -3234,9 +3234,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
98.93103790283203,
|
||||
497.91851806640625,
|
||||
497.91845703125,
|
||||
512.579833984375,
|
||||
654.5245208740234
|
||||
654.5244903564453
|
||||
],
|
||||
"page": 4,
|
||||
"span": [
|
||||
@ -8153,7 +8153,7 @@
|
||||
62.02753829956055,
|
||||
440.3381042480469,
|
||||
285.78955078125,
|
||||
596.3199310302734
|
||||
596.3199462890625
|
||||
],
|
||||
"page": 6,
|
||||
"span": [
|
||||
@ -10514,9 +10514,9 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
80.35525512695312,
|
||||
80.35527038574219,
|
||||
496.5545349121094,
|
||||
267.0082092285156,
|
||||
267.00823974609375,
|
||||
641.0637054443359
|
||||
],
|
||||
"page": 7,
|
||||
@ -14214,10 +14214,10 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
72.6590347290039,
|
||||
452.1459655761719,
|
||||
274.83465576171875,
|
||||
619.5191955566406
|
||||
72.65901947021484,
|
||||
452.14599609375,
|
||||
274.8346862792969,
|
||||
619.5191650390625
|
||||
],
|
||||
"page": 8,
|
||||
"span": [
|
||||
|
File diff suppressed because it is too large
Load Diff
@ -2686,7 +2686,7 @@
|
||||
"b": 102.78223000000003,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8858679533004761,
|
||||
"confidence": 0.8858681321144104,
|
||||
"cells": [
|
||||
{
|
||||
"index": 1,
|
||||
@ -2816,7 +2816,7 @@
|
||||
"b": 179.20818999999995,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9577404260635376,
|
||||
"confidence": 0.957740306854248,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -13628,7 +13628,7 @@
|
||||
"b": 102.78223000000003,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8858679533004761,
|
||||
"confidence": 0.8858681321144104,
|
||||
"cells": [
|
||||
{
|
||||
"index": 1,
|
||||
@ -13770,7 +13770,7 @@
|
||||
"b": 179.20818999999995,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9577404260635376,
|
||||
"confidence": 0.957740306854248,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -20153,7 +20153,7 @@
|
||||
"b": 179.20818999999995,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9577404260635376,
|
||||
"confidence": 0.957740306854248,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -26486,7 +26486,7 @@
|
||||
"b": 102.78223000000003,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8858679533004761,
|
||||
"confidence": 0.8858681321144104,
|
||||
"cells": [
|
||||
{
|
||||
"index": 1,
|
||||
|
@ -2498,9 +2498,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
148.45364379882812,
|
||||
366.1537780761719,
|
||||
366.1538391113281,
|
||||
464.3608093261719,
|
||||
583.6257629394531
|
||||
583.6257476806641
|
||||
],
|
||||
"page": 2,
|
||||
"span": [
|
||||
@ -2541,9 +2541,9 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
164.65028381347656,
|
||||
164.6503143310547,
|
||||
511.6590576171875,
|
||||
449.5505676269531,
|
||||
449.550537109375,
|
||||
628.2029113769531
|
||||
],
|
||||
"page": 7,
|
||||
@ -2563,7 +2563,7 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
140.70968627929688,
|
||||
140.70960998535156,
|
||||
198.32281494140625,
|
||||
472.73382568359375,
|
||||
283.9361572265625
|
||||
@ -2585,10 +2585,10 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
162.67430114746094,
|
||||
128.78643798828125,
|
||||
451.70062255859375,
|
||||
347.37744140625
|
||||
162.67434692382812,
|
||||
128.786376953125,
|
||||
451.70068359375,
|
||||
347.3774719238281
|
||||
],
|
||||
"page": 10,
|
||||
"span": [
|
||||
@ -2607,9 +2607,9 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
168.39285278320312,
|
||||
168.3928985595703,
|
||||
157.99432373046875,
|
||||
447.35137939453125,
|
||||
447.3513488769531,
|
||||
610.0334930419922
|
||||
],
|
||||
"page": 11,
|
||||
@ -4065,7 +4065,7 @@
|
||||
143.6376495361328,
|
||||
528.7375183105469,
|
||||
470.8485412597656,
|
||||
635.6522979736328
|
||||
635.6522827148438
|
||||
],
|
||||
"page": 10,
|
||||
"span": [
|
||||
|
File diff suppressed because it is too large
Load Diff
@ -426,7 +426,7 @@
|
||||
320.4467468261719,
|
||||
81.689208984375,
|
||||
558.8576049804688,
|
||||
352.359375
|
||||
352.3592834472656
|
||||
],
|
||||
"page": 1,
|
||||
"span": [
|
||||
|
@ -3411,7 +3411,7 @@
|
||||
"b": 519.65363,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9695363640785217,
|
||||
"confidence": 0.9695364832878113,
|
||||
"cells": [
|
||||
{
|
||||
"index": 34,
|
||||
@ -4081,7 +4081,7 @@
|
||||
"b": 142.65363000000002,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9263731241226196,
|
||||
"confidence": 0.9263732433319092,
|
||||
"cells": [
|
||||
{
|
||||
"index": 59,
|
||||
@ -4611,7 +4611,7 @@
|
||||
"b": 382.15362999999996,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9253152012825012,
|
||||
"confidence": 0.9253151416778564,
|
||||
"cells": [
|
||||
{
|
||||
"index": 79,
|
||||
@ -4651,7 +4651,7 @@
|
||||
"b": 409.15362999999996,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9676451683044434,
|
||||
"confidence": 0.9676452875137329,
|
||||
"cells": [
|
||||
{
|
||||
"index": 80,
|
||||
@ -4711,12 +4711,12 @@
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 320.4467468261719,
|
||||
"t": 421.640625,
|
||||
"t": 421.6407165527344,
|
||||
"r": 558.8576049804688,
|
||||
"b": 692.310791015625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9881086945533752,
|
||||
"confidence": 0.9881085753440857,
|
||||
"cells": [
|
||||
{
|
||||
"index": 82,
|
||||
@ -5463,7 +5463,7 @@
|
||||
"b": 713.009598,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9449448585510254,
|
||||
"confidence": 0.9449449777603149,
|
||||
"cells": [
|
||||
{
|
||||
"index": 93,
|
||||
@ -5528,7 +5528,7 @@
|
||||
"b": 710.989597,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9497622847557068,
|
||||
"confidence": 0.9497623443603516,
|
||||
"cells": [
|
||||
{
|
||||
"index": 95,
|
||||
@ -5593,7 +5593,7 @@
|
||||
"b": 740.290298,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9368568658828735,
|
||||
"confidence": 0.9368569850921631,
|
||||
"cells": [
|
||||
{
|
||||
"index": 97,
|
||||
@ -6624,7 +6624,7 @@
|
||||
"b": 519.65363,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9695363640785217,
|
||||
"confidence": 0.9695364832878113,
|
||||
"cells": [
|
||||
{
|
||||
"index": 34,
|
||||
@ -7312,7 +7312,7 @@
|
||||
"b": 142.65363000000002,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9263731241226196,
|
||||
"confidence": 0.9263732433319092,
|
||||
"cells": [
|
||||
{
|
||||
"index": 59,
|
||||
@ -7854,7 +7854,7 @@
|
||||
"b": 382.15362999999996,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9253152012825012,
|
||||
"confidence": 0.9253151416778564,
|
||||
"cells": [
|
||||
{
|
||||
"index": 79,
|
||||
@ -7900,7 +7900,7 @@
|
||||
"b": 409.15362999999996,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9676451683044434,
|
||||
"confidence": 0.9676452875137329,
|
||||
"cells": [
|
||||
{
|
||||
"index": 80,
|
||||
@ -7966,12 +7966,12 @@
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 320.4467468261719,
|
||||
"t": 421.640625,
|
||||
"t": 421.6407165527344,
|
||||
"r": 558.8576049804688,
|
||||
"b": 692.310791015625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9881086945533752,
|
||||
"confidence": 0.9881085753440857,
|
||||
"cells": [
|
||||
{
|
||||
"index": 82,
|
||||
@ -8738,7 +8738,7 @@
|
||||
"b": 713.009598,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9449448585510254,
|
||||
"confidence": 0.9449449777603149,
|
||||
"cells": [
|
||||
{
|
||||
"index": 93,
|
||||
@ -8809,7 +8809,7 @@
|
||||
"b": 710.989597,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9497622847557068,
|
||||
"confidence": 0.9497623443603516,
|
||||
"cells": [
|
||||
{
|
||||
"index": 95,
|
||||
@ -8880,7 +8880,7 @@
|
||||
"b": 740.290298,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9368568658828735,
|
||||
"confidence": 0.9368569850921631,
|
||||
"cells": [
|
||||
{
|
||||
"index": 97,
|
||||
@ -9904,7 +9904,7 @@
|
||||
"b": 519.65363,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9695363640785217,
|
||||
"confidence": 0.9695364832878113,
|
||||
"cells": [
|
||||
{
|
||||
"index": 34,
|
||||
@ -10592,7 +10592,7 @@
|
||||
"b": 142.65363000000002,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9263731241226196,
|
||||
"confidence": 0.9263732433319092,
|
||||
"cells": [
|
||||
{
|
||||
"index": 59,
|
||||
@ -11134,7 +11134,7 @@
|
||||
"b": 382.15362999999996,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9253152012825012,
|
||||
"confidence": 0.9253151416778564,
|
||||
"cells": [
|
||||
{
|
||||
"index": 79,
|
||||
@ -11180,7 +11180,7 @@
|
||||
"b": 409.15362999999996,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9676451683044434,
|
||||
"confidence": 0.9676452875137329,
|
||||
"cells": [
|
||||
{
|
||||
"index": 80,
|
||||
@ -11246,12 +11246,12 @@
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 320.4467468261719,
|
||||
"t": 421.640625,
|
||||
"t": 421.6407165527344,
|
||||
"r": 558.8576049804688,
|
||||
"b": 692.310791015625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9881086945533752,
|
||||
"confidence": 0.9881085753440857,
|
||||
"cells": [
|
||||
{
|
||||
"index": 82,
|
||||
@ -12018,7 +12018,7 @@
|
||||
"b": 713.009598,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9449448585510254,
|
||||
"confidence": 0.9449449777603149,
|
||||
"cells": [
|
||||
{
|
||||
"index": 93,
|
||||
@ -12089,7 +12089,7 @@
|
||||
"b": 710.989597,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9497622847557068,
|
||||
"confidence": 0.9497623443603516,
|
||||
"cells": [
|
||||
{
|
||||
"index": 95,
|
||||
@ -12162,7 +12162,7 @@
|
||||
"b": 740.290298,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9368568658828735,
|
||||
"confidence": 0.9368569850921631,
|
||||
"cells": [
|
||||
{
|
||||
"index": 97,
|
||||
|
@ -1541,7 +1541,7 @@
|
||||
"b": 358.76782,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5588350296020508,
|
||||
"confidence": 0.5588339567184448,
|
||||
"cells": [
|
||||
{
|
||||
"index": 18,
|
||||
@ -1581,7 +1581,7 @@
|
||||
"b": 406.74554,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6312209963798523,
|
||||
"confidence": 0.6312211155891418,
|
||||
"cells": [
|
||||
{
|
||||
"index": 19,
|
||||
@ -2036,7 +2036,7 @@
|
||||
"b": 607.23564,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9843751788139343,
|
||||
"confidence": 0.9843752980232239,
|
||||
"cells": [
|
||||
{
|
||||
"index": 36,
|
||||
@ -2719,7 +2719,7 @@
|
||||
"b": 358.76782,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5588350296020508,
|
||||
"confidence": 0.5588339567184448,
|
||||
"cells": [
|
||||
{
|
||||
"index": 18,
|
||||
@ -2765,7 +2765,7 @@
|
||||
"b": 406.74554,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6312209963798523,
|
||||
"confidence": 0.6312211155891418,
|
||||
"cells": [
|
||||
{
|
||||
"index": 19,
|
||||
@ -3232,7 +3232,7 @@
|
||||
"b": 607.23564,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9843751788139343,
|
||||
"confidence": 0.9843752980232239,
|
||||
"cells": [
|
||||
{
|
||||
"index": 36,
|
||||
@ -3914,7 +3914,7 @@
|
||||
"b": 358.76782,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5588350296020508,
|
||||
"confidence": 0.5588339567184448,
|
||||
"cells": [
|
||||
{
|
||||
"index": 18,
|
||||
@ -3960,7 +3960,7 @@
|
||||
"b": 406.74554,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6312209963798523,
|
||||
"confidence": 0.6312211155891418,
|
||||
"cells": [
|
||||
{
|
||||
"index": 19,
|
||||
@ -4427,7 +4427,7 @@
|
||||
"b": 607.23564,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9843751788139343,
|
||||
"confidence": 0.9843752980232239,
|
||||
"cells": [
|
||||
{
|
||||
"index": 36,
|
||||
@ -5782,7 +5782,7 @@
|
||||
"b": 137.5481507594625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.950506865978241,
|
||||
"confidence": 0.9505067467689514,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -6302,7 +6302,7 @@
|
||||
"b": 373.7119120634245,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8727474808692932,
|
||||
"confidence": 0.8727476000785828,
|
||||
"cells": [
|
||||
{
|
||||
"index": 19,
|
||||
@ -7037,7 +7037,7 @@
|
||||
"b": 704.5687238902275,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8504500389099121,
|
||||
"confidence": 0.8504503965377808,
|
||||
"cells": [
|
||||
{
|
||||
"index": 46,
|
||||
@ -7092,7 +7092,7 @@
|
||||
"b": 137.5481507594625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.950506865978241,
|
||||
"confidence": 0.9505067467689514,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -7630,7 +7630,7 @@
|
||||
"b": 373.7119120634245,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8727474808692932,
|
||||
"confidence": 0.8727476000785828,
|
||||
"cells": [
|
||||
{
|
||||
"index": 19,
|
||||
@ -8389,7 +8389,7 @@
|
||||
"b": 704.5687238902275,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8504500389099121,
|
||||
"confidence": 0.8504503965377808,
|
||||
"cells": [
|
||||
{
|
||||
"index": 46,
|
||||
@ -8437,7 +8437,7 @@
|
||||
"b": 137.5481507594625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.950506865978241,
|
||||
"confidence": 0.9505067467689514,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -8975,7 +8975,7 @@
|
||||
"b": 373.7119120634245,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8727474808692932,
|
||||
"confidence": 0.8727476000785828,
|
||||
"cells": [
|
||||
{
|
||||
"index": 19,
|
||||
@ -9736,7 +9736,7 @@
|
||||
"b": 704.5687238902275,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8504500389099121,
|
||||
"confidence": 0.8504503965377808,
|
||||
"cells": [
|
||||
{
|
||||
"index": 46,
|
||||
|
55
tests/data/groundtruth/docling_v1/multi_page.doctags.txt
Normal file
55
tests/data/groundtruth/docling_v1/multi_page.doctags.txt
Normal file
@ -0,0 +1,55 @@
|
||||
<document>
|
||||
<subtitle-level-1><location><page_1><loc_12><loc_90><loc_44><loc_91></location>The Evolution of the Word Processor</subtitle-level-1>
|
||||
<paragraph><location><page_1><loc_12><loc_85><loc_84><loc_88></location>The concept of the word processor predates modern computers and has evolved through several technological milestones.</paragraph>
|
||||
<subtitle-level-1><location><page_1><loc_12><loc_81><loc_55><loc_83></location>Pre-Digital Era (19th - Early 20th Century)</subtitle-level-1>
|
||||
<paragraph><location><page_1><loc_12><loc_73><loc_85><loc_80></location>The origins of word processing can be traced back to the invention of the typewriter in the mid-19th century. Patented in 1868 by Christopher Latham Sholes, the typewriter revolutionized written communication by enabling people to produce legible, professional documents more efficiently than handwriting.</paragraph>
|
||||
<paragraph><location><page_1><loc_12><loc_65><loc_85><loc_71></location>During this period, the term "word processing" didn't exist, but the typewriter laid the groundwork for future developments. Over time, advancements such as carbon paper (for copies) and the electric typewriter (introduced by IBM in 1935) improved the speed and convenience of document creation.</paragraph>
|
||||
<subtitle-level-1><location><page_1><loc_12><loc_58><loc_57><loc_60></location>The Birth of Word Processing (1960s - 1970s)</subtitle-level-1>
|
||||
<paragraph><location><page_1><loc_12><loc_52><loc_88><loc_56></location>The term "word processor" first emerged in the 1960s and referred to any system designed to streamline written communication and document production. Early word processors were not software programs but rather standalone machines.</paragraph>
|
||||
<paragraph><location><page_1><loc_15><loc_43><loc_87><loc_50></location>- · IBM MT/ST (Magnetic Tape/Selectric Typewriter) : Introduced in 1964, this machine combined IBM's Selectric typewriter with magnetic tape storage. It allowed users to record, edit, and replay typed content-an early example of digital text storage.</paragraph>
|
||||
<paragraph><location><page_1><loc_15><loc_38><loc_84><loc_43></location>- · Wang Laboratories : In the 1970s, Wang introduced dedicated word processing machines. These devices, like the Wang 1200, featured small screens and floppy disks, making them revolutionary for their time.</paragraph>
|
||||
<paragraph><location><page_1><loc_12><loc_33><loc_86><loc_37></location>These machines were primarily used in offices, where secretarial pools benefited from their ability to make revisions without retyping entire documents.</paragraph>
|
||||
<subtitle-level-1><location><page_1><loc_12><loc_27><loc_52><loc_28></location>The Rise of Personal Computers (1980s)</subtitle-level-1>
|
||||
<paragraph><location><page_1><loc_12><loc_22><loc_87><loc_25></location>The advent of personal computers in the late 1970s and early 1980s transformed word processing from a niche tool to an essential technology for businesses and individuals alike.</paragraph>
|
||||
<paragraph><location><page_1><loc_15><loc_15><loc_88><loc_20></location>- · WordStar (1978) : Developed for the CP/M operating system, WordStar was one of the first widely used word processing programs. It featured early examples of modern features like cut, copy, and paste.</paragraph>
|
||||
<paragraph><location><page_1><loc_15><loc_10><loc_88><loc_15></location>- · Microsoft Word (1983) : Microsoft launched Word for MS-DOS in 1983, introducing a graphical user interface (GUI) and mouse support. Over the years, Microsoft Word became the industry standard for word processing.</paragraph>
|
||||
<paragraph><location><page_2><loc_12><loc_87><loc_87><loc_91></location>Other notable software from this era included WordPerfect, which was popular among legal professionals, and Apple's MacWrite, which leveraged the Macintosh's graphical capabilities.</paragraph>
|
||||
<subtitle-level-1><location><page_2><loc_12><loc_80><loc_46><loc_81></location>The Modern Era (1990s - Present)</subtitle-level-1>
|
||||
<paragraph><location><page_2><loc_12><loc_75><loc_86><loc_78></location>By the 1990s, word processing software had become more sophisticated, with features like spell check, grammar check, templates, and collaborative tools.</paragraph>
|
||||
<paragraph><location><page_2><loc_15><loc_70><loc_83><loc_73></location>- · Microsoft Office Suite : Microsoft continued to dominate with its Office Suite, integrating Word with other productivity tools like Excel and PowerPoint.</paragraph>
|
||||
<paragraph><location><page_2><loc_15><loc_67><loc_87><loc_70></location>- · OpenOffice and LibreOffice : Open-source alternatives emerged in the early 2000s, offering free and flexible word processing options.</paragraph>
|
||||
<paragraph><location><page_2><loc_15><loc_62><loc_88><loc_67></location>- · Google Docs (2006) : The introduction of cloud-based word processing revolutionized collaboration. Google Docs enabled real-time editing and sharing, making it a staple for teams and remote work.</paragraph>
|
||||
<subtitle-level-1><location><page_2><loc_12><loc_55><loc_39><loc_57></location>Future of Word Processing</subtitle-level-1>
|
||||
<paragraph><location><page_2><loc_12><loc_45><loc_87><loc_53></location>Today, word processors are more than just tools for typing. They integrate artificial intelligence for grammar and style suggestions (e.g., Grammarly), voice-to-text features, and advanced layout options. As AI continues to advance, word processors may evolve into even more intuitive tools that predict user needs, automate repetitive tasks, and support richer multimedia integration.</paragraph>
|
||||
<paragraph><location><page_2><loc_12><loc_35><loc_87><loc_40></location>From the clunky typewriters of the 19th century to the AI-powered cloud tools of today, the word processor has come a long way. It remains an essential tool for communication and creativity, shaping how we write and share ideas.</paragraph>
|
||||
<subtitle-level-1><location><page_3><loc_12><loc_90><loc_46><loc_91></location>Specialized Word Processing Tools</subtitle-level-1>
|
||||
<paragraph><location><page_3><loc_12><loc_83><loc_86><loc_88></location>In addition to general-purpose word processors, specialized tools have emerged to cater to specific industries and needs. These tools incorporate unique features tailored to their users' workflows:</paragraph>
|
||||
<paragraph><location><page_3><loc_15><loc_73><loc_87><loc_81></location>- · Academic and Technical Writing : Tools like LaTeX gained popularity among academics, scientists, and engineers. Unlike traditional word processors, LaTeX focuses on precise formatting, particularly for complex mathematical equations, scientific papers, and technical documents. It relies on a markup language to produce polished documents suitable for publishing.</paragraph>
|
||||
<paragraph><location><page_3><loc_15><loc_67><loc_85><loc_73></location>- · Screenwriting Software : For screenwriters, tools like Final Draft and Celtx are specialized to handle scripts for film and television. These programs automate the formatting of dialogue, scene descriptions, and other elements unique to screenwriting.</paragraph>
|
||||
<paragraph><location><page_3><loc_15><loc_60><loc_88><loc_67></location>- · Legal Document Processors : Word processors tailored for legal professionals, like WordPerfect, offered features such as redlining (early version tracking) and document comparison. Even today, many law firms rely on these tools due to their robust formatting options for contracts and legal briefs.</paragraph>
|
||||
<subtitle-level-1><location><page_3><loc_12><loc_53><loc_57><loc_55></location>Key Features That Changed Word Processing</subtitle-level-1>
|
||||
<paragraph><location><page_3><loc_12><loc_47><loc_86><loc_52></location>The evolution of word processors wasn't just about hardware or software improvements-it was about the features that revolutionized how people wrote and edited. Some of these transformative features include:</paragraph>
|
||||
<paragraph><location><page_3><loc_15><loc_42><loc_86><loc_45></location>- 1. Undo/Redo : Introduced in the 1980s, the ability to undo mistakes and redo actions made experimentation and error correction much easier.</paragraph>
|
||||
<paragraph><location><page_3><loc_15><loc_38><loc_87><loc_42></location>- 2. Spell Check and Grammar Check : By the 1990s, these became standard, allowing users to spot errors automatically.</paragraph>
|
||||
<paragraph><location><page_3><loc_15><loc_35><loc_82><loc_38></location>- 3. Templates : Pre-designed formats for documents, such as resumes, letters, and invoices, helped users save time.</paragraph>
|
||||
<paragraph><location><page_3><loc_15><loc_32><loc_84><loc_35></location>- 4. Track Changes : A game-changer for collaboration, this feature allowed multiple users to suggest edits while maintaining the original text.</paragraph>
|
||||
<paragraph><location><page_3><loc_15><loc_27><loc_88><loc_32></location>- 5. Real-Time Collaboration : Tools like Google Docs and Microsoft 365 enabled multiple users to edit the same document simultaneously, forever changing teamwork dynamics.</paragraph>
|
||||
<subtitle-level-1><location><page_3><loc_12><loc_20><loc_52><loc_22></location>The Cultural Impact of Word Processors</subtitle-level-1>
|
||||
<paragraph><location><page_3><loc_12><loc_14><loc_87><loc_18></location>The word processor didn't just change workplaces-it changed culture. It democratized writing, enabling anyone with access to a computer to produce professional-quality documents. This shift had profound implications for education, business, and creative fields:</paragraph>
|
||||
<paragraph><location><page_4><loc_15><loc_87><loc_86><loc_91></location>- · Accessibility : Writers no longer needed expensive publishing equipment or training in typesetting to create polished work. This accessibility paved the way for selfpublishing, blogging, and even fan fiction communities.</paragraph>
|
||||
<paragraph><location><page_4><loc_15><loc_82><loc_88><loc_87></location>- · Education : Word processors became a cornerstone of education, teaching students not only how to write essays but also how to use technology effectively. Features like bibliography generators and integrated research tools enhanced learning.</paragraph>
|
||||
<paragraph><location><page_4><loc_15><loc_77><loc_87><loc_82></location>- · Creative Writing : Writers gained powerful tools to organize their ideas. Programs like Scrivener allowed authors to manage large projects, from novels to screenplays, with features like chapter outlines and character notes.</paragraph>
|
||||
<subtitle-level-1><location><page_4><loc_12><loc_70><loc_50><loc_72></location>Word Processors in a Post-Digital Era</subtitle-level-1>
|
||||
<paragraph><location><page_4><loc_12><loc_67><loc_88><loc_68></location>As we move further into the 21st century, the role of the word processor continues to evolve:</paragraph>
|
||||
<paragraph><location><page_4><loc_15><loc_58><loc_88><loc_65></location>- 1. Artificial Intelligence : Modern word processors are leveraging AI to suggest content improvements. Tools like Grammarly, ProWritingAid, and even native features in Word now analyze tone, conciseness, and clarity. Some AI systems can even generate entire paragraphs or rewrite sentences.</paragraph>
|
||||
<paragraph><location><page_4><loc_15><loc_52><loc_86><loc_58></location>- 2. Integration with Other Tools : Word processors are no longer standalone. They integrate with task managers, cloud storage, and project management platforms. For instance, Google Docs syncs with Google Drive, while Microsoft Word integrates seamlessly with OneDrive and Teams.</paragraph>
|
||||
<paragraph><location><page_4><loc_15><loc_45><loc_84><loc_52></location>- 3. Voice Typing : Speech-to-text capabilities have made word processing more accessible, particularly for those with disabilities. Tools like Dragon NaturallySpeaking and built-in options in Google Docs and Microsoft Word have made dictation mainstream.</paragraph>
|
||||
<paragraph><location><page_4><loc_15><loc_40><loc_87><loc_45></location>- 4. Multimedia Documents : Word processing has expanded beyond text. Modern tools allow users to embed images, videos, charts, and interactive elements, transforming simple documents into rich multimedia experiences.</paragraph>
|
||||
<paragraph><location><page_4><loc_15><loc_35><loc_86><loc_40></location>- 5. Cross-Platform Accessibility : Thanks to cloud computing, documents can now be accessed and edited across devices. Whether you're on a desktop, tablet, or smartphone, you can continue working seamlessly.</paragraph>
|
||||
<subtitle-level-1><location><page_4><loc_12><loc_29><loc_38><loc_30></location>A Glimpse Into the Future</subtitle-level-1>
|
||||
<paragraph><location><page_4><loc_12><loc_24><loc_87><loc_27></location>The word processor's future lies in adaptability and intelligence. Some exciting possibilities include:</paragraph>
|
||||
<paragraph><location><page_4><loc_15><loc_19><loc_87><loc_22></location>- · Fully AI-Assisted Writing : Imagine a word processor that understands your writing style, drafts emails, or creates entire essays based on minimal input.</paragraph>
|
||||
<paragraph><location><page_4><loc_15><loc_14><loc_88><loc_19></location>- · Immersive Interfaces : As augmented reality (AR) and virtual reality (VR) technology advance, users may be able to write and edit in 3D spaces, collaborating in virtual environments.</paragraph>
|
||||
<paragraph><location><page_4><loc_15><loc_11><loc_87><loc_14></location>- · Hyper-Personalization : Word processors could offer dynamic suggestions based on industry-specific needs, user habits, or even regional language variations.</paragraph>
|
||||
<paragraph><location><page_5><loc_12><loc_80><loc_86><loc_88></location>The journey of the word processor-from clunky typewriters to AI-powered platformsreflects humanity's broader technological progress. What began as a tool to simply replace handwriting has transformed into a powerful ally for creativity, communication, and collaboration. As technology continues to advance, the word processor will undoubtedly remain at the heart of how we express ideas and connect with one another.</paragraph>
|
||||
</document>
|
1319
tests/data/groundtruth/docling_v1/multi_page.json
Normal file
1319
tests/data/groundtruth/docling_v1/multi_page.json
Normal file
File diff suppressed because it is too large
Load Diff
105
tests/data/groundtruth/docling_v1/multi_page.md
Normal file
105
tests/data/groundtruth/docling_v1/multi_page.md
Normal file
@ -0,0 +1,105 @@
|
||||
## The Evolution of the Word Processor
|
||||
|
||||
The concept of the word processor predates modern computers and has evolved through several technological milestones.
|
||||
|
||||
## Pre-Digital Era (19th - Early 20th Century)
|
||||
|
||||
The origins of word processing can be traced back to the invention of the typewriter in the mid-19th century. Patented in 1868 by Christopher Latham Sholes, the typewriter revolutionized written communication by enabling people to produce legible, professional documents more efficiently than handwriting.
|
||||
|
||||
During this period, the term "word processing" didn't exist, but the typewriter laid the groundwork for future developments. Over time, advancements such as carbon paper (for copies) and the electric typewriter (introduced by IBM in 1935) improved the speed and convenience of document creation.
|
||||
|
||||
## The Birth of Word Processing (1960s - 1970s)
|
||||
|
||||
The term "word processor" first emerged in the 1960s and referred to any system designed to streamline written communication and document production. Early word processors were not software programs but rather standalone machines.
|
||||
|
||||
- · IBM MT/ST (Magnetic Tape/Selectric Typewriter) : Introduced in 1964, this machine combined IBM's Selectric typewriter with magnetic tape storage. It allowed users to record, edit, and replay typed content-an early example of digital text storage.
|
||||
|
||||
- · Wang Laboratories : In the 1970s, Wang introduced dedicated word processing machines. These devices, like the Wang 1200, featured small screens and floppy disks, making them revolutionary for their time.
|
||||
|
||||
These machines were primarily used in offices, where secretarial pools benefited from their ability to make revisions without retyping entire documents.
|
||||
|
||||
## The Rise of Personal Computers (1980s)
|
||||
|
||||
The advent of personal computers in the late 1970s and early 1980s transformed word processing from a niche tool to an essential technology for businesses and individuals alike.
|
||||
|
||||
- · WordStar (1978) : Developed for the CP/M operating system, WordStar was one of the first widely used word processing programs. It featured early examples of modern features like cut, copy, and paste.
|
||||
|
||||
- · Microsoft Word (1983) : Microsoft launched Word for MS-DOS in 1983, introducing a graphical user interface (GUI) and mouse support. Over the years, Microsoft Word became the industry standard for word processing.
|
||||
|
||||
Other notable software from this era included WordPerfect, which was popular among legal professionals, and Apple's MacWrite, which leveraged the Macintosh's graphical capabilities.
|
||||
|
||||
## The Modern Era (1990s - Present)
|
||||
|
||||
By the 1990s, word processing software had become more sophisticated, with features like spell check, grammar check, templates, and collaborative tools.
|
||||
|
||||
- · Microsoft Office Suite : Microsoft continued to dominate with its Office Suite, integrating Word with other productivity tools like Excel and PowerPoint.
|
||||
|
||||
- · OpenOffice and LibreOffice : Open-source alternatives emerged in the early 2000s, offering free and flexible word processing options.
|
||||
|
||||
- · Google Docs (2006) : The introduction of cloud-based word processing revolutionized collaboration. Google Docs enabled real-time editing and sharing, making it a staple for teams and remote work.
|
||||
|
||||
## Future of Word Processing
|
||||
|
||||
Today, word processors are more than just tools for typing. They integrate artificial intelligence for grammar and style suggestions (e.g., Grammarly), voice-to-text features, and advanced layout options. As AI continues to advance, word processors may evolve into even more intuitive tools that predict user needs, automate repetitive tasks, and support richer multimedia integration.
|
||||
|
||||
From the clunky typewriters of the 19th century to the AI-powered cloud tools of today, the word processor has come a long way. It remains an essential tool for communication and creativity, shaping how we write and share ideas.
|
||||
|
||||
## Specialized Word Processing Tools
|
||||
|
||||
In addition to general-purpose word processors, specialized tools have emerged to cater to specific industries and needs. These tools incorporate unique features tailored to their users' workflows:
|
||||
|
||||
- · Academic and Technical Writing : Tools like LaTeX gained popularity among academics, scientists, and engineers. Unlike traditional word processors, LaTeX focuses on precise formatting, particularly for complex mathematical equations, scientific papers, and technical documents. It relies on a markup language to produce polished documents suitable for publishing.
|
||||
|
||||
- · Screenwriting Software : For screenwriters, tools like Final Draft and Celtx are specialized to handle scripts for film and television. These programs automate the formatting of dialogue, scene descriptions, and other elements unique to screenwriting.
|
||||
|
||||
- · Legal Document Processors : Word processors tailored for legal professionals, like WordPerfect, offered features such as redlining (early version tracking) and document comparison. Even today, many law firms rely on these tools due to their robust formatting options for contracts and legal briefs.
|
||||
|
||||
## Key Features That Changed Word Processing
|
||||
|
||||
The evolution of word processors wasn't just about hardware or software improvements-it was about the features that revolutionized how people wrote and edited. Some of these transformative features include:
|
||||
|
||||
- 1. Undo/Redo : Introduced in the 1980s, the ability to undo mistakes and redo actions made experimentation and error correction much easier.
|
||||
|
||||
- 2. Spell Check and Grammar Check : By the 1990s, these became standard, allowing users to spot errors automatically.
|
||||
|
||||
- 3. Templates : Pre-designed formats for documents, such as resumes, letters, and invoices, helped users save time.
|
||||
|
||||
- 4. Track Changes : A game-changer for collaboration, this feature allowed multiple users to suggest edits while maintaining the original text.
|
||||
|
||||
- 5. Real-Time Collaboration : Tools like Google Docs and Microsoft 365 enabled multiple users to edit the same document simultaneously, forever changing teamwork dynamics.
|
||||
|
||||
## The Cultural Impact of Word Processors
|
||||
|
||||
The word processor didn't just change workplaces-it changed culture. It democratized writing, enabling anyone with access to a computer to produce professional-quality documents. This shift had profound implications for education, business, and creative fields:
|
||||
|
||||
- · Accessibility : Writers no longer needed expensive publishing equipment or training in typesetting to create polished work. This accessibility paved the way for selfpublishing, blogging, and even fan fiction communities.
|
||||
|
||||
- · Education : Word processors became a cornerstone of education, teaching students not only how to write essays but also how to use technology effectively. Features like bibliography generators and integrated research tools enhanced learning.
|
||||
|
||||
- · Creative Writing : Writers gained powerful tools to organize their ideas. Programs like Scrivener allowed authors to manage large projects, from novels to screenplays, with features like chapter outlines and character notes.
|
||||
|
||||
## Word Processors in a Post-Digital Era
|
||||
|
||||
As we move further into the 21st century, the role of the word processor continues to evolve:
|
||||
|
||||
- 1. Artificial Intelligence : Modern word processors are leveraging AI to suggest content improvements. Tools like Grammarly, ProWritingAid, and even native features in Word now analyze tone, conciseness, and clarity. Some AI systems can even generate entire paragraphs or rewrite sentences.
|
||||
|
||||
- 2. Integration with Other Tools : Word processors are no longer standalone. They integrate with task managers, cloud storage, and project management platforms. For instance, Google Docs syncs with Google Drive, while Microsoft Word integrates seamlessly with OneDrive and Teams.
|
||||
|
||||
- 3. Voice Typing : Speech-to-text capabilities have made word processing more accessible, particularly for those with disabilities. Tools like Dragon NaturallySpeaking and built-in options in Google Docs and Microsoft Word have made dictation mainstream.
|
||||
|
||||
- 4. Multimedia Documents : Word processing has expanded beyond text. Modern tools allow users to embed images, videos, charts, and interactive elements, transforming simple documents into rich multimedia experiences.
|
||||
|
||||
- 5. Cross-Platform Accessibility : Thanks to cloud computing, documents can now be accessed and edited across devices. Whether you're on a desktop, tablet, or smartphone, you can continue working seamlessly.
|
||||
|
||||
## A Glimpse Into the Future
|
||||
|
||||
The word processor's future lies in adaptability and intelligence. Some exciting possibilities include:
|
||||
|
||||
- · Fully AI-Assisted Writing : Imagine a word processor that understands your writing style, drafts emails, or creates entire essays based on minimal input.
|
||||
|
||||
- · Immersive Interfaces : As augmented reality (AR) and virtual reality (VR) technology advance, users may be able to write and edit in 3D spaces, collaborating in virtual environments.
|
||||
|
||||
- · Hyper-Personalization : Word processors could offer dynamic suggestions based on industry-specific needs, user habits, or even regional language variations.
|
||||
|
||||
The journey of the word processor-from clunky typewriters to AI-powered platformsreflects humanity's broader technological progress. What began as a tool to simply replace handwriting has transformed into a powerful ally for creativity, communication, and collaboration. As technology continues to advance, the word processor will undoubtedly remain at the heart of how we express ideas and connect with one another.
|
21968
tests/data/groundtruth/docling_v1/multi_page.pages.json
Normal file
21968
tests/data/groundtruth/docling_v1/multi_page.pages.json
Normal file
File diff suppressed because it is too large
Load Diff
@ -222,7 +222,7 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
134.9200439453125,
|
||||
134.9199981689453,
|
||||
281.78173828125,
|
||||
475.6635437011719,
|
||||
487.109375
|
||||
@ -244,7 +244,7 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
218.8155517578125,
|
||||
218.81556701660156,
|
||||
283.10589599609375,
|
||||
391.96246337890625,
|
||||
513.9846496582031
|
||||
|
@ -1390,7 +1390,7 @@
|
||||
"id": 2,
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 134.9200439453125,
|
||||
"l": 134.9199981689453,
|
||||
"t": 304.890625,
|
||||
"r": 475.6635437011719,
|
||||
"b": 510.21826171875,
|
||||
@ -2174,7 +2174,7 @@
|
||||
"id": 2,
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 134.9200439453125,
|
||||
"l": 134.9199981689453,
|
||||
"t": 304.890625,
|
||||
"r": 475.6635437011719,
|
||||
"b": 510.21826171875,
|
||||
@ -2909,7 +2909,7 @@
|
||||
"id": 2,
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 134.9200439453125,
|
||||
"l": 134.9199981689453,
|
||||
"t": 304.890625,
|
||||
"r": 475.6635437011719,
|
||||
"b": 510.21826171875,
|
||||
@ -3623,7 +3623,7 @@
|
||||
"b": 268.20489999999995,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9870928525924683,
|
||||
"confidence": 0.987092912197113,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -3938,7 +3938,7 @@
|
||||
"b": 532.05774,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9494236707687378,
|
||||
"confidence": 0.9494234323501587,
|
||||
"cells": [
|
||||
{
|
||||
"index": 12,
|
||||
@ -4302,7 +4302,7 @@
|
||||
"id": 2,
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 218.8155517578125,
|
||||
"l": 218.81556701660156,
|
||||
"t": 278.0153503417969,
|
||||
"r": 391.96246337890625,
|
||||
"b": 508.89410400390625,
|
||||
@ -4337,7 +4337,7 @@
|
||||
"b": 268.20489999999995,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9870928525924683,
|
||||
"confidence": 0.987092912197113,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -4658,7 +4658,7 @@
|
||||
"b": 532.05774,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9494236707687378,
|
||||
"confidence": 0.9494234323501587,
|
||||
"cells": [
|
||||
{
|
||||
"index": 12,
|
||||
@ -5040,7 +5040,7 @@
|
||||
"id": 2,
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 218.8155517578125,
|
||||
"l": 218.81556701660156,
|
||||
"t": 278.0153503417969,
|
||||
"r": 391.96246337890625,
|
||||
"b": 508.89410400390625,
|
||||
@ -5072,7 +5072,7 @@
|
||||
"b": 268.20489999999995,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9870928525924683,
|
||||
"confidence": 0.987092912197113,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -5393,7 +5393,7 @@
|
||||
"b": 532.05774,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9494236707687378,
|
||||
"confidence": 0.9494234323501587,
|
||||
"cells": [
|
||||
{
|
||||
"index": 12,
|
||||
@ -5729,7 +5729,7 @@
|
||||
"id": 2,
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 218.8155517578125,
|
||||
"l": 218.81556701660156,
|
||||
"t": 278.0153503417969,
|
||||
"r": 391.96246337890625,
|
||||
"b": 508.89410400390625,
|
||||
|
@ -3989,7 +3989,7 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
33.09040069580078,
|
||||
33.09052658081055,
|
||||
89.5469970703125,
|
||||
585.1502075195312,
|
||||
498.9671630859375
|
||||
@ -4055,9 +4055,9 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
64.1669921875,
|
||||
64.16704559326172,
|
||||
103.87176513671875,
|
||||
258.7742919921875,
|
||||
258.77435302734375,
|
||||
188.49365234375
|
||||
],
|
||||
"page": 3,
|
||||
@ -4099,7 +4099,7 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
145.4144744873047,
|
||||
145.41448974609375,
|
||||
156.616943359375,
|
||||
252.08840942382812,
|
||||
264.7552490234375
|
||||
@ -4121,10 +4121,10 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
32.075252532958984,
|
||||
554.0420684814453,
|
||||
32.075260162353516,
|
||||
554.0421142578125,
|
||||
239.620361328125,
|
||||
721.4226226806641
|
||||
721.4226608276367
|
||||
],
|
||||
"page": 5,
|
||||
"span": [
|
||||
@ -4168,7 +4168,7 @@
|
||||
135.97177124023438,
|
||||
381.39068603515625,
|
||||
545.4180908203125,
|
||||
684.5892486572266
|
||||
684.5892562866211
|
||||
],
|
||||
"page": 10,
|
||||
"span": [
|
||||
@ -4187,10 +4187,10 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
135.64837646484375,
|
||||
135.64834594726562,
|
||||
197.24334716796875,
|
||||
301.2367248535156,
|
||||
407.8262939453125
|
||||
301.23675537109375,
|
||||
407.8263244628906
|
||||
],
|
||||
"page": 11,
|
||||
"span": [
|
||||
@ -4209,10 +4209,10 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
63.801902770996094,
|
||||
621.9678497314453,
|
||||
547.11474609375,
|
||||
696.6175842285156
|
||||
63.80195617675781,
|
||||
621.9679107666016,
|
||||
547.1146850585938,
|
||||
696.6176071166992
|
||||
],
|
||||
"page": 14,
|
||||
"span": [
|
||||
@ -4231,7 +4231,7 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
63.985130310058594,
|
||||
63.9850959777832,
|
||||
145.8603515625,
|
||||
530.0478515625,
|
||||
364.09503173828125
|
||||
@ -4254,9 +4254,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
136.5016632080078,
|
||||
314.4587707519531,
|
||||
314.45880126953125,
|
||||
545.4508666992188,
|
||||
672.7508773803711
|
||||
672.7509078979492
|
||||
],
|
||||
"page": 15,
|
||||
"span": [
|
||||
@ -4343,10 +4343,10 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
136.1496124267578,
|
||||
76.34844970703125,
|
||||
547.5267944335938,
|
||||
659.9669647216797
|
||||
136.1495819091797,
|
||||
76.3485107421875,
|
||||
547.52685546875,
|
||||
659.9669189453125
|
||||
],
|
||||
"page": 2,
|
||||
"span": [
|
||||
@ -6705,9 +6705,9 @@
|
||||
{
|
||||
"bbox": [
|
||||
135.52462768554688,
|
||||
349.949462890625,
|
||||
349.94940185546875,
|
||||
545.8714599609375,
|
||||
502.2747802734375
|
||||
502.2746887207031
|
||||
],
|
||||
"page": 8,
|
||||
"span": [
|
||||
@ -7164,7 +7164,7 @@
|
||||
64.41139221191406,
|
||||
70.39208984375,
|
||||
547.3950805664062,
|
||||
398.3863830566406
|
||||
398.3863525390625
|
||||
],
|
||||
"page": 9,
|
||||
"span": [
|
||||
@ -9130,7 +9130,7 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
63.55636978149414,
|
||||
63.55635070800781,
|
||||
495.77532958984375,
|
||||
548.5687255859375,
|
||||
687.7661285400391
|
||||
|
File diff suppressed because it is too large
Load Diff
@ -1171,7 +1171,7 @@
|
||||
"b": 295.08200000000005,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9547483325004578,
|
||||
"confidence": 0.9547481536865234,
|
||||
"cells": [
|
||||
{
|
||||
"index": 17,
|
||||
@ -1311,7 +1311,7 @@
|
||||
"b": 350.522,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9672117233276367,
|
||||
"confidence": 0.9672118425369263,
|
||||
"cells": [
|
||||
{
|
||||
"index": 22,
|
||||
@ -1971,7 +1971,7 @@
|
||||
"b": 295.08200000000005,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9547483325004578,
|
||||
"confidence": 0.9547481536865234,
|
||||
"cells": [
|
||||
{
|
||||
"index": 17,
|
||||
@ -2117,7 +2117,7 @@
|
||||
"b": 350.522,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9672117233276367,
|
||||
"confidence": 0.9672118425369263,
|
||||
"cells": [
|
||||
{
|
||||
"index": 22,
|
||||
@ -2770,7 +2770,7 @@
|
||||
"b": 295.08200000000005,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9547483325004578,
|
||||
"confidence": 0.9547481536865234,
|
||||
"cells": [
|
||||
{
|
||||
"index": 17,
|
||||
@ -2916,7 +2916,7 @@
|
||||
"b": 350.522,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9672117233276367,
|
||||
"confidence": 0.9672118425369263,
|
||||
"cells": [
|
||||
{
|
||||
"index": 22,
|
||||
|
@ -5951,7 +5951,7 @@
|
||||
"b": 465.596681609368,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9393879771232605,
|
||||
"confidence": 0.93938809633255,
|
||||
"cells": [
|
||||
{
|
||||
"index": 77,
|
||||
@ -7406,7 +7406,7 @@
|
||||
"b": 534.1167018462124,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5769620537757874,
|
||||
"confidence": 0.5769621729850769,
|
||||
"cells": [
|
||||
{
|
||||
"index": 134,
|
||||
@ -8046,7 +8046,7 @@
|
||||
"b": 650.6431884765625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6444889903068542,
|
||||
"confidence": 0.6444893479347229,
|
||||
"cells": [],
|
||||
"children": []
|
||||
}
|
||||
@ -10042,7 +10042,7 @@
|
||||
"b": 465.596681609368,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9393879771232605,
|
||||
"confidence": 0.93938809633255,
|
||||
"cells": [
|
||||
{
|
||||
"index": 77,
|
||||
@ -11509,7 +11509,7 @@
|
||||
"b": 534.1167018462124,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5769620537757874,
|
||||
"confidence": 0.5769621729850769,
|
||||
"cells": [
|
||||
{
|
||||
"index": 134,
|
||||
@ -12155,7 +12155,7 @@
|
||||
"b": 650.6431884765625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6444889903068542,
|
||||
"confidence": 0.6444893479347229,
|
||||
"cells": [],
|
||||
"children": []
|
||||
},
|
||||
@ -14148,7 +14148,7 @@
|
||||
"b": 465.596681609368,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9393879771232605,
|
||||
"confidence": 0.93938809633255,
|
||||
"cells": [
|
||||
{
|
||||
"index": 77,
|
||||
@ -15615,7 +15615,7 @@
|
||||
"b": 534.1167018462124,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5769620537757874,
|
||||
"confidence": 0.5769621729850769,
|
||||
"cells": [
|
||||
{
|
||||
"index": 134,
|
||||
@ -16261,7 +16261,7 @@
|
||||
"b": 650.6431884765625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6444889903068542,
|
||||
"confidence": 0.6444893479347229,
|
||||
"cells": [],
|
||||
"children": []
|
||||
},
|
||||
|
@ -744,7 +744,7 @@
|
||||
388.5767822265625,
|
||||
739.034423828125,
|
||||
482.4759216308594,
|
||||
806.0041046142578
|
||||
806.0040969848633
|
||||
],
|
||||
"page": 1,
|
||||
"span": [
|
||||
|
@ -1391,7 +1391,7 @@
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 388.5767822265625,
|
||||
"t": 36.03587341308594,
|
||||
"t": 36.03588104248047,
|
||||
"r": 482.4759216308594,
|
||||
"b": 103.00555419921875,
|
||||
"coord_origin": "TOPLEFT"
|
||||
@ -1477,7 +1477,7 @@
|
||||
"b": 81.03008981017001,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6917961239814758,
|
||||
"confidence": 0.6917959451675415,
|
||||
"cells": [
|
||||
{
|
||||
"index": 2,
|
||||
@ -1517,7 +1517,7 @@
|
||||
"b": 790.0379791491694,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.899228036403656,
|
||||
"confidence": 0.8992282152175903,
|
||||
"cells": [
|
||||
{
|
||||
"index": 3,
|
||||
@ -1597,7 +1597,7 @@
|
||||
"b": 323.44982924225053,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6362584233283997,
|
||||
"confidence": 0.6362582445144653,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -2361,7 +2361,7 @@
|
||||
"b": 179.2998695799522,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7258325815200806,
|
||||
"confidence": 0.7258322834968567,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -2891,7 +2891,7 @@
|
||||
"b": 233.17986945372706,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8121814727783203,
|
||||
"confidence": 0.8121819496154785,
|
||||
"cells": [
|
||||
{
|
||||
"index": 25,
|
||||
@ -2931,7 +2931,7 @@
|
||||
"b": 228.73998946412837,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7672220468521118,
|
||||
"confidence": 0.7672221660614014,
|
||||
"cells": [
|
||||
{
|
||||
"index": 26,
|
||||
@ -2971,7 +2971,7 @@
|
||||
"b": 255.88982940052404,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8320456743240356,
|
||||
"confidence": 0.8320454955101013,
|
||||
"cells": [
|
||||
{
|
||||
"index": 27,
|
||||
@ -3011,7 +3011,7 @@
|
||||
"b": 251.44994941092557,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5538824796676636,
|
||||
"confidence": 0.5538817644119263,
|
||||
"cells": [
|
||||
{
|
||||
"index": 28,
|
||||
@ -3051,7 +3051,7 @@
|
||||
"b": 278.5698293473914,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7909000515937805,
|
||||
"confidence": 0.7908995151519775,
|
||||
"cells": [
|
||||
{
|
||||
"index": 29,
|
||||
@ -3131,7 +3131,7 @@
|
||||
"b": 323.44982924225053,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6534578204154968,
|
||||
"confidence": 0.6534579396247864,
|
||||
"cells": [
|
||||
{
|
||||
"index": 31,
|
||||
@ -3236,7 +3236,7 @@
|
||||
"b": 296.80999930466,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5417144298553467,
|
||||
"confidence": 0.5417138934135437,
|
||||
"cells": [
|
||||
{
|
||||
"index": 35,
|
||||
@ -3318,7 +3318,7 @@
|
||||
"b": 596.0198686036978,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.719137966632843,
|
||||
"confidence": 0.7191378474235535,
|
||||
"cells": [
|
||||
{
|
||||
"index": 37,
|
||||
@ -3822,7 +3822,7 @@
|
||||
"b": 386.56997909437825,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8262879252433777,
|
||||
"confidence": 0.8262876868247986,
|
||||
"cells": [
|
||||
{
|
||||
"index": 38,
|
||||
@ -3862,7 +3862,7 @@
|
||||
"b": 413.70983903079747,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7766718864440918,
|
||||
"confidence": 0.7766715884208679,
|
||||
"cells": [
|
||||
{
|
||||
"index": 39,
|
||||
@ -3902,7 +3902,7 @@
|
||||
"b": 409.26995904119883,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8204737901687622,
|
||||
"confidence": 0.8204739093780518,
|
||||
"cells": [
|
||||
{
|
||||
"index": 40,
|
||||
@ -3942,7 +3942,7 @@
|
||||
"b": 436.3898589776647,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7670677900314331,
|
||||
"confidence": 0.7670676708221436,
|
||||
"cells": [
|
||||
{
|
||||
"index": 41,
|
||||
@ -3982,7 +3982,7 @@
|
||||
"b": 432.0699789877849,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8048340082168579,
|
||||
"confidence": 0.8048339486122131,
|
||||
"cells": [
|
||||
{
|
||||
"index": 42,
|
||||
@ -4062,7 +4062,7 @@
|
||||
"b": 454.7499689346523,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.827337384223938,
|
||||
"confidence": 0.8273372054100037,
|
||||
"cells": [
|
||||
{
|
||||
"index": 44,
|
||||
@ -4102,7 +4102,7 @@
|
||||
"b": 481.8698388711183,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7342236638069153,
|
||||
"confidence": 0.7342240214347839,
|
||||
"cells": [
|
||||
{
|
||||
"index": 45,
|
||||
@ -4142,7 +4142,7 @@
|
||||
"b": 477.42995888151955,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8411222696304321,
|
||||
"confidence": 0.8411223888397217,
|
||||
"cells": [
|
||||
{
|
||||
"index": 46,
|
||||
@ -4182,7 +4182,7 @@
|
||||
"b": 528.3098487623228,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7251589894294739,
|
||||
"confidence": 0.7251590490341187,
|
||||
"cells": [
|
||||
{
|
||||
"index": 47,
|
||||
@ -4247,7 +4247,7 @@
|
||||
"b": 501.78997882445117,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7848678827285767,
|
||||
"confidence": 0.7848676443099976,
|
||||
"cells": [
|
||||
{
|
||||
"index": 49,
|
||||
@ -4287,7 +4287,7 @@
|
||||
"b": 573.2198486571116,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7586438059806824,
|
||||
"confidence": 0.758643627166748,
|
||||
"cells": [
|
||||
{
|
||||
"index": 50,
|
||||
@ -4352,7 +4352,7 @@
|
||||
"b": 546.69997871924,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7897851467132568,
|
||||
"confidence": 0.7897858619689941,
|
||||
"cells": [
|
||||
{
|
||||
"index": 52,
|
||||
@ -4432,7 +4432,7 @@
|
||||
"b": 591.5799886140991,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8144810795783997,
|
||||
"confidence": 0.8144806027412415,
|
||||
"cells": [
|
||||
{
|
||||
"index": 54,
|
||||
@ -4484,7 +4484,7 @@
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 388.5767822265625,
|
||||
"t": 36.03587341308594,
|
||||
"t": 36.03588104248047,
|
||||
"r": 482.4759216308594,
|
||||
"b": 103.00555419921875,
|
||||
"coord_origin": "TOPLEFT"
|
||||
@ -4580,7 +4580,7 @@
|
||||
"b": 81.03008981017001,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6917961239814758,
|
||||
"confidence": 0.6917959451675415,
|
||||
"cells": [
|
||||
{
|
||||
"index": 2,
|
||||
@ -4626,7 +4626,7 @@
|
||||
"b": 790.0379791491694,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.899228036403656,
|
||||
"confidence": 0.8992282152175903,
|
||||
"cells": [
|
||||
{
|
||||
"index": 3,
|
||||
@ -4718,7 +4718,7 @@
|
||||
"b": 323.44982924225053,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6362584233283997,
|
||||
"confidence": 0.6362582445144653,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -5482,7 +5482,7 @@
|
||||
"b": 179.2998695799522,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7258325815200806,
|
||||
"confidence": 0.7258322834968567,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -6012,7 +6012,7 @@
|
||||
"b": 233.17986945372706,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8121814727783203,
|
||||
"confidence": 0.8121819496154785,
|
||||
"cells": [
|
||||
{
|
||||
"index": 25,
|
||||
@ -6052,7 +6052,7 @@
|
||||
"b": 228.73998946412837,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7672220468521118,
|
||||
"confidence": 0.7672221660614014,
|
||||
"cells": [
|
||||
{
|
||||
"index": 26,
|
||||
@ -6092,7 +6092,7 @@
|
||||
"b": 255.88982940052404,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8320456743240356,
|
||||
"confidence": 0.8320454955101013,
|
||||
"cells": [
|
||||
{
|
||||
"index": 27,
|
||||
@ -6132,7 +6132,7 @@
|
||||
"b": 251.44994941092557,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5538824796676636,
|
||||
"confidence": 0.5538817644119263,
|
||||
"cells": [
|
||||
{
|
||||
"index": 28,
|
||||
@ -6172,7 +6172,7 @@
|
||||
"b": 278.5698293473914,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7909000515937805,
|
||||
"confidence": 0.7908995151519775,
|
||||
"cells": [
|
||||
{
|
||||
"index": 29,
|
||||
@ -6252,7 +6252,7 @@
|
||||
"b": 323.44982924225053,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6534578204154968,
|
||||
"confidence": 0.6534579396247864,
|
||||
"cells": [
|
||||
{
|
||||
"index": 31,
|
||||
@ -6357,7 +6357,7 @@
|
||||
"b": 296.80999930466,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5417144298553467,
|
||||
"confidence": 0.5417138934135437,
|
||||
"cells": [
|
||||
{
|
||||
"index": 35,
|
||||
@ -6451,7 +6451,7 @@
|
||||
"b": 596.0198686036978,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.719137966632843,
|
||||
"confidence": 0.7191378474235535,
|
||||
"cells": [
|
||||
{
|
||||
"index": 37,
|
||||
@ -6955,7 +6955,7 @@
|
||||
"b": 386.56997909437825,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8262879252433777,
|
||||
"confidence": 0.8262876868247986,
|
||||
"cells": [
|
||||
{
|
||||
"index": 38,
|
||||
@ -6995,7 +6995,7 @@
|
||||
"b": 413.70983903079747,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7766718864440918,
|
||||
"confidence": 0.7766715884208679,
|
||||
"cells": [
|
||||
{
|
||||
"index": 39,
|
||||
@ -7035,7 +7035,7 @@
|
||||
"b": 409.26995904119883,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8204737901687622,
|
||||
"confidence": 0.8204739093780518,
|
||||
"cells": [
|
||||
{
|
||||
"index": 40,
|
||||
@ -7075,7 +7075,7 @@
|
||||
"b": 436.3898589776647,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7670677900314331,
|
||||
"confidence": 0.7670676708221436,
|
||||
"cells": [
|
||||
{
|
||||
"index": 41,
|
||||
@ -7115,7 +7115,7 @@
|
||||
"b": 432.0699789877849,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8048340082168579,
|
||||
"confidence": 0.8048339486122131,
|
||||
"cells": [
|
||||
{
|
||||
"index": 42,
|
||||
@ -7195,7 +7195,7 @@
|
||||
"b": 454.7499689346523,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.827337384223938,
|
||||
"confidence": 0.8273372054100037,
|
||||
"cells": [
|
||||
{
|
||||
"index": 44,
|
||||
@ -7235,7 +7235,7 @@
|
||||
"b": 481.8698388711183,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7342236638069153,
|
||||
"confidence": 0.7342240214347839,
|
||||
"cells": [
|
||||
{
|
||||
"index": 45,
|
||||
@ -7275,7 +7275,7 @@
|
||||
"b": 477.42995888151955,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8411222696304321,
|
||||
"confidence": 0.8411223888397217,
|
||||
"cells": [
|
||||
{
|
||||
"index": 46,
|
||||
@ -7315,7 +7315,7 @@
|
||||
"b": 528.3098487623228,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7251589894294739,
|
||||
"confidence": 0.7251590490341187,
|
||||
"cells": [
|
||||
{
|
||||
"index": 47,
|
||||
@ -7380,7 +7380,7 @@
|
||||
"b": 501.78997882445117,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7848678827285767,
|
||||
"confidence": 0.7848676443099976,
|
||||
"cells": [
|
||||
{
|
||||
"index": 49,
|
||||
@ -7420,7 +7420,7 @@
|
||||
"b": 573.2198486571116,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7586438059806824,
|
||||
"confidence": 0.758643627166748,
|
||||
"cells": [
|
||||
{
|
||||
"index": 50,
|
||||
@ -7485,7 +7485,7 @@
|
||||
"b": 546.69997871924,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7897851467132568,
|
||||
"confidence": 0.7897858619689941,
|
||||
"cells": [
|
||||
{
|
||||
"index": 52,
|
||||
@ -7565,7 +7565,7 @@
|
||||
"b": 591.5799886140991,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8144810795783997,
|
||||
"confidence": 0.8144806027412415,
|
||||
"cells": [
|
||||
{
|
||||
"index": 54,
|
||||
@ -7610,7 +7610,7 @@
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 388.5767822265625,
|
||||
"t": 36.03587341308594,
|
||||
"t": 36.03588104248047,
|
||||
"r": 482.4759216308594,
|
||||
"b": 103.00555419921875,
|
||||
"coord_origin": "TOPLEFT"
|
||||
@ -7706,7 +7706,7 @@
|
||||
"b": 81.03008981017001,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6917961239814758,
|
||||
"confidence": 0.6917959451675415,
|
||||
"cells": [
|
||||
{
|
||||
"index": 2,
|
||||
@ -7798,7 +7798,7 @@
|
||||
"b": 323.44982924225053,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6362584233283997,
|
||||
"confidence": 0.6362582445144653,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -8562,7 +8562,7 @@
|
||||
"b": 179.2998695799522,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7258325815200806,
|
||||
"confidence": 0.7258322834968567,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -9092,7 +9092,7 @@
|
||||
"b": 233.17986945372706,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8121814727783203,
|
||||
"confidence": 0.8121819496154785,
|
||||
"cells": [
|
||||
{
|
||||
"index": 25,
|
||||
@ -9132,7 +9132,7 @@
|
||||
"b": 228.73998946412837,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7672220468521118,
|
||||
"confidence": 0.7672221660614014,
|
||||
"cells": [
|
||||
{
|
||||
"index": 26,
|
||||
@ -9172,7 +9172,7 @@
|
||||
"b": 255.88982940052404,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8320456743240356,
|
||||
"confidence": 0.8320454955101013,
|
||||
"cells": [
|
||||
{
|
||||
"index": 27,
|
||||
@ -9212,7 +9212,7 @@
|
||||
"b": 251.44994941092557,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5538824796676636,
|
||||
"confidence": 0.5538817644119263,
|
||||
"cells": [
|
||||
{
|
||||
"index": 28,
|
||||
@ -9252,7 +9252,7 @@
|
||||
"b": 278.5698293473914,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7909000515937805,
|
||||
"confidence": 0.7908995151519775,
|
||||
"cells": [
|
||||
{
|
||||
"index": 29,
|
||||
@ -9332,7 +9332,7 @@
|
||||
"b": 323.44982924225053,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6534578204154968,
|
||||
"confidence": 0.6534579396247864,
|
||||
"cells": [
|
||||
{
|
||||
"index": 31,
|
||||
@ -9437,7 +9437,7 @@
|
||||
"b": 296.80999930466,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5417144298553467,
|
||||
"confidence": 0.5417138934135437,
|
||||
"cells": [
|
||||
{
|
||||
"index": 35,
|
||||
@ -9531,7 +9531,7 @@
|
||||
"b": 596.0198686036978,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.719137966632843,
|
||||
"confidence": 0.7191378474235535,
|
||||
"cells": [
|
||||
{
|
||||
"index": 37,
|
||||
@ -10035,7 +10035,7 @@
|
||||
"b": 386.56997909437825,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8262879252433777,
|
||||
"confidence": 0.8262876868247986,
|
||||
"cells": [
|
||||
{
|
||||
"index": 38,
|
||||
@ -10075,7 +10075,7 @@
|
||||
"b": 413.70983903079747,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7766718864440918,
|
||||
"confidence": 0.7766715884208679,
|
||||
"cells": [
|
||||
{
|
||||
"index": 39,
|
||||
@ -10115,7 +10115,7 @@
|
||||
"b": 409.26995904119883,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8204737901687622,
|
||||
"confidence": 0.8204739093780518,
|
||||
"cells": [
|
||||
{
|
||||
"index": 40,
|
||||
@ -10155,7 +10155,7 @@
|
||||
"b": 436.3898589776647,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7670677900314331,
|
||||
"confidence": 0.7670676708221436,
|
||||
"cells": [
|
||||
{
|
||||
"index": 41,
|
||||
@ -10195,7 +10195,7 @@
|
||||
"b": 432.0699789877849,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8048340082168579,
|
||||
"confidence": 0.8048339486122131,
|
||||
"cells": [
|
||||
{
|
||||
"index": 42,
|
||||
@ -10275,7 +10275,7 @@
|
||||
"b": 454.7499689346523,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.827337384223938,
|
||||
"confidence": 0.8273372054100037,
|
||||
"cells": [
|
||||
{
|
||||
"index": 44,
|
||||
@ -10315,7 +10315,7 @@
|
||||
"b": 481.8698388711183,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7342236638069153,
|
||||
"confidence": 0.7342240214347839,
|
||||
"cells": [
|
||||
{
|
||||
"index": 45,
|
||||
@ -10355,7 +10355,7 @@
|
||||
"b": 477.42995888151955,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8411222696304321,
|
||||
"confidence": 0.8411223888397217,
|
||||
"cells": [
|
||||
{
|
||||
"index": 46,
|
||||
@ -10395,7 +10395,7 @@
|
||||
"b": 528.3098487623228,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7251589894294739,
|
||||
"confidence": 0.7251590490341187,
|
||||
"cells": [
|
||||
{
|
||||
"index": 47,
|
||||
@ -10460,7 +10460,7 @@
|
||||
"b": 501.78997882445117,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7848678827285767,
|
||||
"confidence": 0.7848676443099976,
|
||||
"cells": [
|
||||
{
|
||||
"index": 49,
|
||||
@ -10500,7 +10500,7 @@
|
||||
"b": 573.2198486571116,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7586438059806824,
|
||||
"confidence": 0.758643627166748,
|
||||
"cells": [
|
||||
{
|
||||
"index": 50,
|
||||
@ -10565,7 +10565,7 @@
|
||||
"b": 546.69997871924,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7897851467132568,
|
||||
"confidence": 0.7897858619689941,
|
||||
"cells": [
|
||||
{
|
||||
"index": 52,
|
||||
@ -10645,7 +10645,7 @@
|
||||
"b": 591.5799886140991,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8144810795783997,
|
||||
"confidence": 0.8144806027412415,
|
||||
"cells": [
|
||||
{
|
||||
"index": 54,
|
||||
@ -10695,7 +10695,7 @@
|
||||
"b": 790.0379791491694,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.899228036403656,
|
||||
"confidence": 0.8992282152175903,
|
||||
"cells": [
|
||||
{
|
||||
"index": 3,
|
||||
|
@ -16094,9 +16094,9 @@
|
||||
"page_no": 1,
|
||||
"bbox": {
|
||||
"l": 315.65362548828125,
|
||||
"t": 563.276611328125,
|
||||
"t": 563.2765655517578,
|
||||
"r": 537.1475219726562,
|
||||
"b": 489.1985778808594,
|
||||
"b": 489.19854736328125,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -16443,9 +16443,9 @@
|
||||
"page_no": 3,
|
||||
"bbox": {
|
||||
"l": 312.10369873046875,
|
||||
"t": 713.5591354370117,
|
||||
"t": 713.5591125488281,
|
||||
"r": 550.38916015625,
|
||||
"b": 541.3901519775391,
|
||||
"b": 541.3901214599609,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -16658,7 +16658,7 @@
|
||||
"page_no": 5,
|
||||
"bbox": {
|
||||
"l": 74.30525970458984,
|
||||
"t": 714.0887985229492,
|
||||
"t": 714.0887908935547,
|
||||
"r": 519.9801025390625,
|
||||
"b": 608.2984924316406,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
@ -16829,7 +16829,7 @@
|
||||
"bbox": {
|
||||
"l": 53.03328323364258,
|
||||
"t": 534.3346557617188,
|
||||
"r": 285.3731689453125,
|
||||
"r": 285.3731384277344,
|
||||
"b": 284.3311462402344,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
@ -16862,7 +16862,7 @@
|
||||
"page_no": 8,
|
||||
"bbox": {
|
||||
"l": 49.97503662109375,
|
||||
"t": 688.2873382568359,
|
||||
"t": 688.2873153686523,
|
||||
"r": 301.6335754394531,
|
||||
"b": 604.4210662841797,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
@ -16895,7 +16895,7 @@
|
||||
{
|
||||
"page_no": 8,
|
||||
"bbox": {
|
||||
"l": 305.5836486816406,
|
||||
"l": 305.58367919921875,
|
||||
"t": 693.3458404541016,
|
||||
"r": 554.8258666992188,
|
||||
"b": 611.3732452392578,
|
||||
@ -16978,9 +16978,9 @@
|
||||
"page_no": 8,
|
||||
"bbox": {
|
||||
"l": 216.76925659179688,
|
||||
"t": 411.5093688964844,
|
||||
"t": 411.5093994140625,
|
||||
"r": 375.7829284667969,
|
||||
"b": 348.65301513671875,
|
||||
"b": 348.6529541015625,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -17177,9 +17177,9 @@
|
||||
{
|
||||
"page_no": 8,
|
||||
"bbox": {
|
||||
"l": 383.1364440917969,
|
||||
"t": 410.7686767578125,
|
||||
"r": 542.1132202148438,
|
||||
"l": 383.1363830566406,
|
||||
"t": 410.7687072753906,
|
||||
"r": 542.1131591796875,
|
||||
"b": 349.2250671386719,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
@ -17482,7 +17482,7 @@
|
||||
{
|
||||
"page_no": 14,
|
||||
"bbox": {
|
||||
"l": 51.15378952026367,
|
||||
"l": 51.153778076171875,
|
||||
"t": 687.6914825439453,
|
||||
"r": 282.8598937988281,
|
||||
"b": 447.09332275390625,
|
||||
@ -17580,10 +17580,10 @@
|
||||
{
|
||||
"page_no": 15,
|
||||
"bbox": {
|
||||
"l": 55.116363525390625,
|
||||
"l": 55.11635208129883,
|
||||
"t": 655.7449951171875,
|
||||
"r": 279.370849609375,
|
||||
"b": 542.6654510498047,
|
||||
"b": 542.6654968261719,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -17701,9 +17701,9 @@
|
||||
"page_no": 15,
|
||||
"bbox": {
|
||||
"l": 323.46868896484375,
|
||||
"t": 429.5491638183594,
|
||||
"t": 429.5492248535156,
|
||||
"r": 525.9569091796875,
|
||||
"b": 327.739501953125,
|
||||
"b": 327.73956298828125,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -17765,7 +17765,7 @@
|
||||
"page_no": 16,
|
||||
"bbox": {
|
||||
"l": 66.79948425292969,
|
||||
"t": 538.3836822509766,
|
||||
"t": 538.3837127685547,
|
||||
"r": 528.5565795898438,
|
||||
"b": 293.8616027832031,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
@ -17801,9 +17801,9 @@
|
||||
"page_no": 1,
|
||||
"bbox": {
|
||||
"l": 315.65362548828125,
|
||||
"t": 563.276611328125,
|
||||
"t": 563.2765655517578,
|
||||
"r": 537.1475219726562,
|
||||
"b": 489.1985778808594,
|
||||
"b": 489.19854736328125,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -18771,9 +18771,9 @@
|
||||
{
|
||||
"page_no": 4,
|
||||
"bbox": {
|
||||
"l": 310.67584228515625,
|
||||
"t": 718.8061141967773,
|
||||
"r": 542.9547119140625,
|
||||
"l": 310.6757507324219,
|
||||
"t": 718.8061218261719,
|
||||
"r": 542.9546508789062,
|
||||
"b": 636.7794799804688,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
@ -22946,7 +22946,7 @@
|
||||
"page_no": 7,
|
||||
"bbox": {
|
||||
"l": 332.9688720703125,
|
||||
"t": 251.7164306640625,
|
||||
"t": 251.71649169921875,
|
||||
"r": 520.942138671875,
|
||||
"b": 148.73028564453125,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
@ -24069,9 +24069,9 @@
|
||||
"page_no": 8,
|
||||
"bbox": {
|
||||
"l": 53.62853240966797,
|
||||
"t": 573.0514221191406,
|
||||
"t": 573.0514526367188,
|
||||
"r": 298.5574951171875,
|
||||
"b": 499.60003662109375,
|
||||
"b": 499.6000061035156,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -27719,7 +27719,7 @@
|
||||
{
|
||||
"page_no": 13,
|
||||
"bbox": {
|
||||
"l": 83.31756591796875,
|
||||
"l": 83.31759643554688,
|
||||
"t": 395.9864501953125,
|
||||
"r": 248.873046875,
|
||||
"b": 304.7430114746094,
|
||||
@ -27759,9 +27759,9 @@
|
||||
"page_no": 13,
|
||||
"bbox": {
|
||||
"l": 310.3294372558594,
|
||||
"t": 690.8223266601562,
|
||||
"t": 690.8223342895508,
|
||||
"r": 555.8338623046875,
|
||||
"b": 655.8524780273438,
|
||||
"b": 655.8524932861328,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -27798,9 +27798,9 @@
|
||||
"page_no": 13,
|
||||
"bbox": {
|
||||
"l": 309.9566345214844,
|
||||
"t": 637.3855133056641,
|
||||
"t": 637.3854827880859,
|
||||
"r": 555.7466430664062,
|
||||
"b": 607.2774658203125,
|
||||
"b": 607.2774353027344,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -27832,10 +27832,10 @@
|
||||
{
|
||||
"page_no": 13,
|
||||
"bbox": {
|
||||
"l": 309.9635314941406,
|
||||
"t": 596.2945861816406,
|
||||
"r": 555.7054443359375,
|
||||
"b": 558.4485473632812,
|
||||
"l": 309.96356201171875,
|
||||
"t": 596.2945098876953,
|
||||
"r": 555.7053833007812,
|
||||
"b": 558.4485168457031,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -28050,10 +28050,10 @@
|
||||
{
|
||||
"page_no": 14,
|
||||
"bbox": {
|
||||
"l": 51.72642135620117,
|
||||
"t": 518.3907165527344,
|
||||
"r": 283.114013671875,
|
||||
"b": 447.7554931640625,
|
||||
"l": 51.726383209228516,
|
||||
"t": 518.3907470703125,
|
||||
"r": 283.1140441894531,
|
||||
"b": 447.7555236816406,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -28085,7 +28085,7 @@
|
||||
{
|
||||
"page_no": 14,
|
||||
"bbox": {
|
||||
"l": 51.434879302978516,
|
||||
"l": 51.43488693237305,
|
||||
"t": 338.51251220703125,
|
||||
"r": 310.7267150878906,
|
||||
"b": 300.17974853515625,
|
||||
@ -28155,7 +28155,7 @@
|
||||
{
|
||||
"page_no": 14,
|
||||
"bbox": {
|
||||
"l": 51.27280807495117,
|
||||
"l": 51.2728271484375,
|
||||
"t": 238.271484375,
|
||||
"r": 311.0897216796875,
|
||||
"b": 200.086669921875,
|
||||
@ -28408,9 +28408,9 @@
|
||||
{
|
||||
"page_no": 14,
|
||||
"bbox": {
|
||||
"l": 319.06494140625,
|
||||
"t": 182.1591796875,
|
||||
"r": 533.77392578125,
|
||||
"l": 319.0649719238281,
|
||||
"t": 182.1590576171875,
|
||||
"r": 533.7738647460938,
|
||||
"b": 122.80792236328125,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
@ -28443,10 +28443,10 @@
|
||||
{
|
||||
"page_no": 15,
|
||||
"bbox": {
|
||||
"l": 55.116363525390625,
|
||||
"l": 55.11635208129883,
|
||||
"t": 655.7449951171875,
|
||||
"r": 279.370849609375,
|
||||
"b": 542.6654510498047,
|
||||
"b": 542.6654968261719,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -28517,10 +28517,10 @@
|
||||
{
|
||||
"page_no": 15,
|
||||
"bbox": {
|
||||
"l": 323.0059509277344,
|
||||
"t": 670.4528503417969,
|
||||
"r": 525.95166015625,
|
||||
"b": 569.0885925292969,
|
||||
"l": 323.0059814453125,
|
||||
"t": 670.4528656005859,
|
||||
"r": 525.9517211914062,
|
||||
"b": 569.0885772705078,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -28557,9 +28557,9 @@
|
||||
"page_no": 15,
|
||||
"bbox": {
|
||||
"l": 323.384765625,
|
||||
"t": 550.0270538330078,
|
||||
"t": 550.0270690917969,
|
||||
"r": 526.1268920898438,
|
||||
"b": 447.90789794921875,
|
||||
"b": 447.9078674316406,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -28592,9 +28592,9 @@
|
||||
"page_no": 15,
|
||||
"bbox": {
|
||||
"l": 323.46868896484375,
|
||||
"t": 429.5491638183594,
|
||||
"t": 429.5492248535156,
|
||||
"r": 525.9569091796875,
|
||||
"b": 327.739501953125,
|
||||
"b": 327.73956298828125,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
|
File diff suppressed because it is too large
Load Diff
@ -16866,10 +16866,10 @@
|
||||
{
|
||||
"page_no": 1,
|
||||
"bbox": {
|
||||
"l": 323.408203125,
|
||||
"l": 323.4081115722656,
|
||||
"t": 541.6512603759766,
|
||||
"r": 553.2952270507812,
|
||||
"b": 266.1492919921875,
|
||||
"r": 553.295166015625,
|
||||
"b": 266.14935302734375,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -16941,9 +16941,9 @@
|
||||
"page_no": 3,
|
||||
"bbox": {
|
||||
"l": 88.33030700683594,
|
||||
"t": 699.1134796142578,
|
||||
"t": 699.1134490966797,
|
||||
"r": 263.7049560546875,
|
||||
"b": 571.4317321777344,
|
||||
"b": 571.4317626953125,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -16979,9 +16979,9 @@
|
||||
"page_no": 4,
|
||||
"bbox": {
|
||||
"l": 53.05912780761719,
|
||||
"t": 481.2087097167969,
|
||||
"t": 481.20867919921875,
|
||||
"r": 295.8506164550781,
|
||||
"b": 251.135986328125,
|
||||
"b": 251.1358642578125,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -17255,9 +17255,9 @@
|
||||
"page_no": 4,
|
||||
"bbox": {
|
||||
"l": 98.93103790283203,
|
||||
"t": 654.5245208740234,
|
||||
"t": 654.5244903564453,
|
||||
"r": 512.579833984375,
|
||||
"b": 497.91851806640625,
|
||||
"b": 497.91845703125,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -23506,7 +23506,7 @@
|
||||
"page_no": 6,
|
||||
"bbox": {
|
||||
"l": 62.02753829956055,
|
||||
"t": 596.3199310302734,
|
||||
"t": 596.3199462890625,
|
||||
"r": 285.78955078125,
|
||||
"b": 440.3381042480469,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
@ -26668,9 +26668,9 @@
|
||||
{
|
||||
"page_no": 7,
|
||||
"bbox": {
|
||||
"l": 80.35525512695312,
|
||||
"l": 80.35527038574219,
|
||||
"t": 641.0637054443359,
|
||||
"r": 267.0082092285156,
|
||||
"r": 267.00823974609375,
|
||||
"b": 496.5545349121094,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
@ -31588,10 +31588,10 @@
|
||||
{
|
||||
"page_no": 8,
|
||||
"bbox": {
|
||||
"l": 72.6590347290039,
|
||||
"t": 619.5191955566406,
|
||||
"r": 274.83465576171875,
|
||||
"b": 452.1459655761719,
|
||||
"l": 72.65901947021484,
|
||||
"t": 619.5191650390625,
|
||||
"r": 274.8346862792969,
|
||||
"b": 452.14599609375,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
|
File diff suppressed because it is too large
Load Diff
@ -2686,7 +2686,7 @@
|
||||
"b": 102.78223000000003,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8858679533004761,
|
||||
"confidence": 0.8858681321144104,
|
||||
"cells": [
|
||||
{
|
||||
"index": 1,
|
||||
@ -2816,7 +2816,7 @@
|
||||
"b": 179.20818999999995,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9577404260635376,
|
||||
"confidence": 0.957740306854248,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -13628,7 +13628,7 @@
|
||||
"b": 102.78223000000003,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8858679533004761,
|
||||
"confidence": 0.8858681321144104,
|
||||
"cells": [
|
||||
{
|
||||
"index": 1,
|
||||
@ -13770,7 +13770,7 @@
|
||||
"b": 179.20818999999995,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9577404260635376,
|
||||
"confidence": 0.957740306854248,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -20153,7 +20153,7 @@
|
||||
"b": 179.20818999999995,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9577404260635376,
|
||||
"confidence": 0.957740306854248,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -26486,7 +26486,7 @@
|
||||
"b": 102.78223000000003,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8858679533004761,
|
||||
"confidence": 0.8858681321144104,
|
||||
"cells": [
|
||||
{
|
||||
"index": 1,
|
||||
|
@ -14942,9 +14942,9 @@
|
||||
"page_no": 2,
|
||||
"bbox": {
|
||||
"l": 148.45364379882812,
|
||||
"t": 583.6257629394531,
|
||||
"t": 583.6257476806641,
|
||||
"r": 464.3608093261719,
|
||||
"b": 366.1537780761719,
|
||||
"b": 366.1538391113281,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -15221,9 +15221,9 @@
|
||||
{
|
||||
"page_no": 7,
|
||||
"bbox": {
|
||||
"l": 164.65028381347656,
|
||||
"l": 164.6503143310547,
|
||||
"t": 628.2029113769531,
|
||||
"r": 449.5505676269531,
|
||||
"r": 449.550537109375,
|
||||
"b": 511.6590576171875,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
@ -15475,7 +15475,7 @@
|
||||
{
|
||||
"page_no": 8,
|
||||
"bbox": {
|
||||
"l": 140.70968627929688,
|
||||
"l": 140.70960998535156,
|
||||
"t": 283.9361572265625,
|
||||
"r": 472.73382568359375,
|
||||
"b": 198.32281494140625,
|
||||
@ -15804,10 +15804,10 @@
|
||||
{
|
||||
"page_no": 10,
|
||||
"bbox": {
|
||||
"l": 162.67430114746094,
|
||||
"t": 347.37744140625,
|
||||
"r": 451.70062255859375,
|
||||
"b": 128.78643798828125,
|
||||
"l": 162.67434692382812,
|
||||
"t": 347.3774719238281,
|
||||
"r": 451.70068359375,
|
||||
"b": 128.786376953125,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -15875,9 +15875,9 @@
|
||||
{
|
||||
"page_no": 11,
|
||||
"bbox": {
|
||||
"l": 168.39285278320312,
|
||||
"l": 168.3928985595703,
|
||||
"t": 610.0334930419922,
|
||||
"r": 447.35137939453125,
|
||||
"r": 447.3513488769531,
|
||||
"b": 157.99432373046875,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
@ -17702,7 +17702,7 @@
|
||||
"page_no": 10,
|
||||
"bbox": {
|
||||
"l": 143.6376495361328,
|
||||
"t": 635.6522979736328,
|
||||
"t": 635.6522827148438,
|
||||
"r": 470.8485412597656,
|
||||
"b": 528.7375183105469,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
|
File diff suppressed because it is too large
Load Diff
@ -951,7 +951,7 @@
|
||||
"page_no": 1,
|
||||
"bbox": {
|
||||
"l": 320.4467468261719,
|
||||
"t": 352.359375,
|
||||
"t": 352.3592834472656,
|
||||
"r": 558.8576049804688,
|
||||
"b": 81.689208984375,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
|
@ -3411,7 +3411,7 @@
|
||||
"b": 519.65363,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9695363640785217,
|
||||
"confidence": 0.9695364832878113,
|
||||
"cells": [
|
||||
{
|
||||
"index": 34,
|
||||
@ -4081,7 +4081,7 @@
|
||||
"b": 142.65363000000002,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9263731241226196,
|
||||
"confidence": 0.9263732433319092,
|
||||
"cells": [
|
||||
{
|
||||
"index": 59,
|
||||
@ -4611,7 +4611,7 @@
|
||||
"b": 382.15362999999996,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9253152012825012,
|
||||
"confidence": 0.9253151416778564,
|
||||
"cells": [
|
||||
{
|
||||
"index": 79,
|
||||
@ -4651,7 +4651,7 @@
|
||||
"b": 409.15362999999996,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9676451683044434,
|
||||
"confidence": 0.9676452875137329,
|
||||
"cells": [
|
||||
{
|
||||
"index": 80,
|
||||
@ -4711,12 +4711,12 @@
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 320.4467468261719,
|
||||
"t": 421.640625,
|
||||
"t": 421.6407165527344,
|
||||
"r": 558.8576049804688,
|
||||
"b": 692.310791015625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9881086945533752,
|
||||
"confidence": 0.9881085753440857,
|
||||
"cells": [
|
||||
{
|
||||
"index": 82,
|
||||
@ -5463,7 +5463,7 @@
|
||||
"b": 713.009598,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9449448585510254,
|
||||
"confidence": 0.9449449777603149,
|
||||
"cells": [
|
||||
{
|
||||
"index": 93,
|
||||
@ -5528,7 +5528,7 @@
|
||||
"b": 710.989597,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9497622847557068,
|
||||
"confidence": 0.9497623443603516,
|
||||
"cells": [
|
||||
{
|
||||
"index": 95,
|
||||
@ -5593,7 +5593,7 @@
|
||||
"b": 740.290298,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9368568658828735,
|
||||
"confidence": 0.9368569850921631,
|
||||
"cells": [
|
||||
{
|
||||
"index": 97,
|
||||
@ -6624,7 +6624,7 @@
|
||||
"b": 519.65363,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9695363640785217,
|
||||
"confidence": 0.9695364832878113,
|
||||
"cells": [
|
||||
{
|
||||
"index": 34,
|
||||
@ -7312,7 +7312,7 @@
|
||||
"b": 142.65363000000002,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9263731241226196,
|
||||
"confidence": 0.9263732433319092,
|
||||
"cells": [
|
||||
{
|
||||
"index": 59,
|
||||
@ -7854,7 +7854,7 @@
|
||||
"b": 382.15362999999996,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9253152012825012,
|
||||
"confidence": 0.9253151416778564,
|
||||
"cells": [
|
||||
{
|
||||
"index": 79,
|
||||
@ -7900,7 +7900,7 @@
|
||||
"b": 409.15362999999996,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9676451683044434,
|
||||
"confidence": 0.9676452875137329,
|
||||
"cells": [
|
||||
{
|
||||
"index": 80,
|
||||
@ -7966,12 +7966,12 @@
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 320.4467468261719,
|
||||
"t": 421.640625,
|
||||
"t": 421.6407165527344,
|
||||
"r": 558.8576049804688,
|
||||
"b": 692.310791015625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9881086945533752,
|
||||
"confidence": 0.9881085753440857,
|
||||
"cells": [
|
||||
{
|
||||
"index": 82,
|
||||
@ -8738,7 +8738,7 @@
|
||||
"b": 713.009598,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9449448585510254,
|
||||
"confidence": 0.9449449777603149,
|
||||
"cells": [
|
||||
{
|
||||
"index": 93,
|
||||
@ -8809,7 +8809,7 @@
|
||||
"b": 710.989597,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9497622847557068,
|
||||
"confidence": 0.9497623443603516,
|
||||
"cells": [
|
||||
{
|
||||
"index": 95,
|
||||
@ -8880,7 +8880,7 @@
|
||||
"b": 740.290298,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9368568658828735,
|
||||
"confidence": 0.9368569850921631,
|
||||
"cells": [
|
||||
{
|
||||
"index": 97,
|
||||
@ -9904,7 +9904,7 @@
|
||||
"b": 519.65363,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9695363640785217,
|
||||
"confidence": 0.9695364832878113,
|
||||
"cells": [
|
||||
{
|
||||
"index": 34,
|
||||
@ -10592,7 +10592,7 @@
|
||||
"b": 142.65363000000002,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9263731241226196,
|
||||
"confidence": 0.9263732433319092,
|
||||
"cells": [
|
||||
{
|
||||
"index": 59,
|
||||
@ -11134,7 +11134,7 @@
|
||||
"b": 382.15362999999996,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9253152012825012,
|
||||
"confidence": 0.9253151416778564,
|
||||
"cells": [
|
||||
{
|
||||
"index": 79,
|
||||
@ -11180,7 +11180,7 @@
|
||||
"b": 409.15362999999996,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9676451683044434,
|
||||
"confidence": 0.9676452875137329,
|
||||
"cells": [
|
||||
{
|
||||
"index": 80,
|
||||
@ -11246,12 +11246,12 @@
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 320.4467468261719,
|
||||
"t": 421.640625,
|
||||
"t": 421.6407165527344,
|
||||
"r": 558.8576049804688,
|
||||
"b": 692.310791015625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9881086945533752,
|
||||
"confidence": 0.9881085753440857,
|
||||
"cells": [
|
||||
{
|
||||
"index": 82,
|
||||
@ -12018,7 +12018,7 @@
|
||||
"b": 713.009598,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9449448585510254,
|
||||
"confidence": 0.9449449777603149,
|
||||
"cells": [
|
||||
{
|
||||
"index": 93,
|
||||
@ -12089,7 +12089,7 @@
|
||||
"b": 710.989597,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9497622847557068,
|
||||
"confidence": 0.9497623443603516,
|
||||
"cells": [
|
||||
{
|
||||
"index": 95,
|
||||
@ -12162,7 +12162,7 @@
|
||||
"b": 740.290298,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9368568658828735,
|
||||
"confidence": 0.9368569850921631,
|
||||
"cells": [
|
||||
{
|
||||
"index": 97,
|
||||
|
@ -1541,7 +1541,7 @@
|
||||
"b": 358.76782,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5588350296020508,
|
||||
"confidence": 0.5588339567184448,
|
||||
"cells": [
|
||||
{
|
||||
"index": 18,
|
||||
@ -1581,7 +1581,7 @@
|
||||
"b": 406.74554,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6312209963798523,
|
||||
"confidence": 0.6312211155891418,
|
||||
"cells": [
|
||||
{
|
||||
"index": 19,
|
||||
@ -2036,7 +2036,7 @@
|
||||
"b": 607.23564,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9843751788139343,
|
||||
"confidence": 0.9843752980232239,
|
||||
"cells": [
|
||||
{
|
||||
"index": 36,
|
||||
@ -2719,7 +2719,7 @@
|
||||
"b": 358.76782,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5588350296020508,
|
||||
"confidence": 0.5588339567184448,
|
||||
"cells": [
|
||||
{
|
||||
"index": 18,
|
||||
@ -2765,7 +2765,7 @@
|
||||
"b": 406.74554,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6312209963798523,
|
||||
"confidence": 0.6312211155891418,
|
||||
"cells": [
|
||||
{
|
||||
"index": 19,
|
||||
@ -3232,7 +3232,7 @@
|
||||
"b": 607.23564,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9843751788139343,
|
||||
"confidence": 0.9843752980232239,
|
||||
"cells": [
|
||||
{
|
||||
"index": 36,
|
||||
@ -3914,7 +3914,7 @@
|
||||
"b": 358.76782,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5588350296020508,
|
||||
"confidence": 0.5588339567184448,
|
||||
"cells": [
|
||||
{
|
||||
"index": 18,
|
||||
@ -3960,7 +3960,7 @@
|
||||
"b": 406.74554,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6312209963798523,
|
||||
"confidence": 0.6312211155891418,
|
||||
"cells": [
|
||||
{
|
||||
"index": 19,
|
||||
@ -4427,7 +4427,7 @@
|
||||
"b": 607.23564,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9843751788139343,
|
||||
"confidence": 0.9843752980232239,
|
||||
"cells": [
|
||||
{
|
||||
"index": 36,
|
||||
@ -5782,7 +5782,7 @@
|
||||
"b": 137.5481507594625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.950506865978241,
|
||||
"confidence": 0.9505067467689514,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -6302,7 +6302,7 @@
|
||||
"b": 373.7119120634245,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8727474808692932,
|
||||
"confidence": 0.8727476000785828,
|
||||
"cells": [
|
||||
{
|
||||
"index": 19,
|
||||
@ -7037,7 +7037,7 @@
|
||||
"b": 704.5687238902275,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8504500389099121,
|
||||
"confidence": 0.8504503965377808,
|
||||
"cells": [
|
||||
{
|
||||
"index": 46,
|
||||
@ -7092,7 +7092,7 @@
|
||||
"b": 137.5481507594625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.950506865978241,
|
||||
"confidence": 0.9505067467689514,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -7630,7 +7630,7 @@
|
||||
"b": 373.7119120634245,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8727474808692932,
|
||||
"confidence": 0.8727476000785828,
|
||||
"cells": [
|
||||
{
|
||||
"index": 19,
|
||||
@ -8389,7 +8389,7 @@
|
||||
"b": 704.5687238902275,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8504500389099121,
|
||||
"confidence": 0.8504503965377808,
|
||||
"cells": [
|
||||
{
|
||||
"index": 46,
|
||||
@ -8437,7 +8437,7 @@
|
||||
"b": 137.5481507594625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.950506865978241,
|
||||
"confidence": 0.9505067467689514,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -8975,7 +8975,7 @@
|
||||
"b": 373.7119120634245,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8727474808692932,
|
||||
"confidence": 0.8727476000785828,
|
||||
"cells": [
|
||||
{
|
||||
"index": 19,
|
||||
@ -9736,7 +9736,7 @@
|
||||
"b": 704.5687238902275,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8504500389099121,
|
||||
"confidence": 0.8504503965377808,
|
||||
"cells": [
|
||||
{
|
||||
"index": 46,
|
||||
|
66
tests/data/groundtruth/docling_v2/multi_page.doctags.txt
Normal file
66
tests/data/groundtruth/docling_v2/multi_page.doctags.txt
Normal file
@ -0,0 +1,66 @@
|
||||
<doctag><section_header_level_1><loc_60><loc_43><loc_221><loc_51>The Evolution of the Word Processor</section_header_level_1>
|
||||
<text><loc_60><loc_59><loc_418><loc_76>The concept of the word processor predates modern computers and has evolved through several technological milestones.</text>
|
||||
<section_header_level_1><loc_60><loc_84><loc_274><loc_93>Pre-Digital Era (19th - Early 20th Century)</section_header_level_1>
|
||||
<text><loc_60><loc_102><loc_427><loc_134>The origins of word processing can be traced back to the invention of the typewriter in the mid-19th century. Patented in 1868 by Christopher Latham Sholes, the typewriter revolutionized written communication by enabling people to produce legible, professional documents more efficiently than handwriting.</text>
|
||||
<text><loc_60><loc_143><loc_424><loc_175>During this period, the term "word processing" didn't exist, but the typewriter laid the groundwork for future developments. Over time, advancements such as carbon paper (for copies) and the electric typewriter (introduced by IBM in 1935) improved the speed and convenience of document creation.</text>
|
||||
<section_header_level_1><loc_60><loc_201><loc_283><loc_209>The Birth of Word Processing (1960s - 1970s)</section_header_level_1>
|
||||
<text><loc_60><loc_218><loc_440><loc_242>The term "word processor" first emerged in the 1960s and referred to any system designed to streamline written communication and document production. Early word processors were not software programs but rather standalone machines.</text>
|
||||
<unordered_list><list_item><loc_76><loc_251><loc_435><loc_283>· IBM MT/ST (Magnetic Tape/Selectric Typewriter) : Introduced in 1964, this machine combined IBM's Selectric typewriter with magnetic tape storage. It allowed users to record, edit, and replay typed content-an early example of digital text storage.</list_item>
|
||||
<list_item><loc_76><loc_284><loc_418><loc_308>· Wang Laboratories : In the 1970s, Wang introduced dedicated word processing machines. These devices, like the Wang 1200, featured small screens and floppy disks, making them revolutionary for their time.</list_item>
|
||||
</unordered_list>
|
||||
<text><loc_60><loc_316><loc_432><loc_333>These machines were primarily used in offices, where secretarial pools benefited from their ability to make revisions without retyping entire documents.</text>
|
||||
<section_header_level_1><loc_60><loc_358><loc_258><loc_367>The Rise of Personal Computers (1980s)</section_header_level_1>
|
||||
<text><loc_60><loc_375><loc_433><loc_392>The advent of personal computers in the late 1970s and early 1980s transformed word processing from a niche tool to an essential technology for businesses and individuals alike.</text>
|
||||
<unordered_list><list_item><loc_76><loc_400><loc_439><loc_424>· WordStar (1978) : Developed for the CP/M operating system, WordStar was one of the first widely used word processing programs. It featured early examples of modern features like cut, copy, and paste.</list_item>
|
||||
<list_item><loc_76><loc_425><loc_441><loc_449>· Microsoft Word (1983) : Microsoft launched Word for MS-DOS in 1983, introducing a graphical user interface (GUI) and mouse support. Over the years, Microsoft Word became the industry standard for word processing.</list_item>
|
||||
</unordered_list>
|
||||
<page_break>
|
||||
<text><loc_60><loc_43><loc_434><loc_67>Other notable software from this era included WordPerfect, which was popular among legal professionals, and Apple's MacWrite, which leveraged the Macintosh's graphical capabilities.</text>
|
||||
<section_header_level_1><loc_60><loc_93><loc_229><loc_101>The Modern Era (1990s - Present)</section_header_level_1>
|
||||
<text><loc_60><loc_110><loc_429><loc_126>By the 1990s, word processing software had become more sophisticated, with features like spell check, grammar check, templates, and collaborative tools.</text>
|
||||
<unordered_list><list_item><loc_76><loc_135><loc_413><loc_151>· Microsoft Office Suite : Microsoft continued to dominate with its Office Suite, integrating Word with other productivity tools like Excel and PowerPoint.</list_item>
|
||||
<list_item><loc_76><loc_151><loc_435><loc_167>· OpenOffice and LibreOffice : Open-source alternatives emerged in the early 2000s, offering free and flexible word processing options.</list_item>
|
||||
<list_item><loc_76><loc_167><loc_441><loc_192>· Google Docs (2006) : The introduction of cloud-based word processing revolutionized collaboration. Google Docs enabled real-time editing and sharing, making it a staple for teams and remote work.</list_item>
|
||||
</unordered_list>
|
||||
<section_header_level_1><loc_60><loc_217><loc_195><loc_226>Future of Word Processing</section_header_level_1>
|
||||
<text><loc_60><loc_234><loc_437><loc_275>Today, word processors are more than just tools for typing. They integrate artificial intelligence for grammar and style suggestions (e.g., Grammarly), voice-to-text features, and advanced layout options. As AI continues to advance, word processors may evolve into even more intuitive tools that predict user needs, automate repetitive tasks, and support richer multimedia integration.</text>
|
||||
<text><loc_60><loc_300><loc_433><loc_325>From the clunky typewriters of the 19th century to the AI-powered cloud tools of today, the word processor has come a long way. It remains an essential tool for communication and creativity, shaping how we write and share ideas.</text>
|
||||
<page_break>
|
||||
<section_header_level_1><loc_60><loc_43><loc_232><loc_52>Specialized Word Processing Tools</section_header_level_1>
|
||||
<text><loc_60><loc_60><loc_432><loc_85>In addition to general-purpose word processors, specialized tools have emerged to cater to specific industries and needs. These tools incorporate unique features tailored to their users' workflows:</text>
|
||||
<unordered_list><list_item><loc_76><loc_93><loc_436><loc_134>· Academic and Technical Writing : Tools like LaTeX gained popularity among academics, scientists, and engineers. Unlike traditional word processors, LaTeX focuses on precise formatting, particularly for complex mathematical equations, scientific papers, and technical documents. It relies on a markup language to produce polished documents suitable for publishing.</list_item>
|
||||
<list_item><loc_76><loc_134><loc_423><loc_167>· Screenwriting Software : For screenwriters, tools like Final Draft and Celtx are specialized to handle scripts for film and television. These programs automate the formatting of dialogue, scene descriptions, and other elements unique to screenwriting.</list_item>
|
||||
<list_item><loc_76><loc_167><loc_441><loc_200>· Legal Document Processors : Word processors tailored for legal professionals, like WordPerfect, offered features such as redlining (early version tracking) and document comparison. Even today, many law firms rely on these tools due to their robust formatting options for contracts and legal briefs.</list_item>
|
||||
</unordered_list>
|
||||
<section_header_level_1><loc_60><loc_225><loc_286><loc_234>Key Features That Changed Word Processing</section_header_level_1>
|
||||
<text><loc_60><loc_242><loc_432><loc_267>The evolution of word processors wasn't just about hardware or software improvements-it was about the features that revolutionized how people wrote and edited. Some of these transformative features include:</text>
|
||||
<unordered_list><list_item><loc_76><loc_275><loc_428><loc_291>1. Undo/Redo : Introduced in the 1980s, the ability to undo mistakes and redo actions made experimentation and error correction much easier.</list_item>
|
||||
<list_item><loc_76><loc_292><loc_434><loc_308>2. Spell Check and Grammar Check : By the 1990s, these became standard, allowing users to spot errors automatically.</list_item>
|
||||
<list_item><loc_76><loc_308><loc_409><loc_324>3. Templates : Pre-designed formats for documents, such as resumes, letters, and invoices, helped users save time.</list_item>
|
||||
<list_item><loc_76><loc_324><loc_422><loc_340>4. Track Changes : A game-changer for collaboration, this feature allowed multiple users to suggest edits while maintaining the original text.</list_item>
|
||||
<list_item><loc_76><loc_341><loc_438><loc_365>5. Real-Time Collaboration : Tools like Google Docs and Microsoft 365 enabled multiple users to edit the same document simultaneously, forever changing teamwork dynamics.</list_item>
|
||||
</unordered_list>
|
||||
<section_header_level_1><loc_60><loc_390><loc_262><loc_399>The Cultural Impact of Word Processors</section_header_level_1>
|
||||
<text><loc_60><loc_408><loc_436><loc_432>The word processor didn't just change workplaces-it changed culture. It democratized writing, enabling anyone with access to a computer to produce professional-quality documents. This shift had profound implications for education, business, and creative fields:</text>
|
||||
<page_break>
|
||||
<unordered_list><list_item><loc_76><loc_43><loc_432><loc_67>· Accessibility : Writers no longer needed expensive publishing equipment or training in typesetting to create polished work. This accessibility paved the way for selfpublishing, blogging, and even fan fiction communities.</list_item>
|
||||
<list_item><loc_76><loc_67><loc_438><loc_92>· Education : Word processors became a cornerstone of education, teaching students not only how to write essays but also how to use technology effectively. Features like bibliography generators and integrated research tools enhanced learning.</list_item>
|
||||
<list_item><loc_76><loc_92><loc_433><loc_117>· Creative Writing : Writers gained powerful tools to organize their ideas. Programs like Scrivener allowed authors to manage large projects, from novels to screenplays, with features like chapter outlines and character notes.</list_item>
|
||||
</unordered_list>
|
||||
<section_header_level_1><loc_60><loc_142><loc_248><loc_151>Word Processors in a Post-Digital Era</section_header_level_1>
|
||||
<text><loc_60><loc_159><loc_438><loc_167>As we move further into the 21st century, the role of the word processor continues to evolve:</text>
|
||||
<unordered_list><list_item><loc_76><loc_176><loc_440><loc_208>1. Artificial Intelligence : Modern word processors are leveraging AI to suggest content improvements. Tools like Grammarly, ProWritingAid, and even native features in Word now analyze tone, conciseness, and clarity. Some AI systems can even generate entire paragraphs or rewrite sentences.</list_item>
|
||||
<list_item><loc_76><loc_208><loc_432><loc_241>2. Integration with Other Tools : Word processors are no longer standalone. They integrate with task managers, cloud storage, and project management platforms. For instance, Google Docs syncs with Google Drive, while Microsoft Word integrates seamlessly with OneDrive and Teams.</list_item>
|
||||
<list_item><loc_76><loc_241><loc_422><loc_274>3. Voice Typing : Speech-to-text capabilities have made word processing more accessible, particularly for those with disabilities. Tools like Dragon NaturallySpeaking and built-in options in Google Docs and Microsoft Word have made dictation mainstream.</list_item>
|
||||
<list_item><loc_76><loc_274><loc_434><loc_298>4. Multimedia Documents : Word processing has expanded beyond text. Modern tools allow users to embed images, videos, charts, and interactive elements, transforming simple documents into rich multimedia experiences.</list_item>
|
||||
<list_item><loc_76><loc_299><loc_429><loc_323>5. Cross-Platform Accessibility : Thanks to cloud computing, documents can now be accessed and edited across devices. Whether you're on a desktop, tablet, or smartphone, you can continue working seamlessly.</list_item>
|
||||
</unordered_list>
|
||||
<section_header_level_1><loc_60><loc_348><loc_192><loc_357>A Glimpse Into the Future</section_header_level_1>
|
||||
<text><loc_60><loc_366><loc_433><loc_382>The word processor's future lies in adaptability and intelligence. Some exciting possibilities include:</text>
|
||||
<unordered_list><list_item><loc_76><loc_390><loc_435><loc_406>· Fully AI-Assisted Writing : Imagine a word processor that understands your writing style, drafts emails, or creates entire essays based on minimal input.</list_item>
|
||||
<list_item><loc_76><loc_407><loc_441><loc_431>· Immersive Interfaces : As augmented reality (AR) and virtual reality (VR) technology advance, users may be able to write and edit in 3D spaces, collaborating in virtual environments.</list_item>
|
||||
<list_item><loc_76><loc_431><loc_436><loc_447>· Hyper-Personalization : Word processors could offer dynamic suggestions based on industry-specific needs, user habits, or even regional language variations.</list_item>
|
||||
</unordered_list>
|
||||
<page_break>
|
||||
<text><loc_60><loc_59><loc_429><loc_100>The journey of the word processor-from clunky typewriters to AI-powered platformsreflects humanity's broader technological progress. What began as a tool to simply replace handwriting has transformed into a powerful ally for creativity, communication, and collaboration. As technology continues to advance, the word processor will undoubtedly remain at the heart of how we express ideas and connect with one another.</text>
|
||||
</doctag>
|
1949
tests/data/groundtruth/docling_v2/multi_page.json
Normal file
1949
tests/data/groundtruth/docling_v2/multi_page.json
Normal file
File diff suppressed because it is too large
Load Diff
87
tests/data/groundtruth/docling_v2/multi_page.md
Normal file
87
tests/data/groundtruth/docling_v2/multi_page.md
Normal file
@ -0,0 +1,87 @@
|
||||
## The Evolution of the Word Processor
|
||||
|
||||
The concept of the word processor predates modern computers and has evolved through several technological milestones.
|
||||
|
||||
## Pre-Digital Era (19th - Early 20th Century)
|
||||
|
||||
The origins of word processing can be traced back to the invention of the typewriter in the mid-19th century. Patented in 1868 by Christopher Latham Sholes, the typewriter revolutionized written communication by enabling people to produce legible, professional documents more efficiently than handwriting.
|
||||
|
||||
During this period, the term "word processing" didn't exist, but the typewriter laid the groundwork for future developments. Over time, advancements such as carbon paper (for copies) and the electric typewriter (introduced by IBM in 1935) improved the speed and convenience of document creation.
|
||||
|
||||
## The Birth of Word Processing (1960s - 1970s)
|
||||
|
||||
The term "word processor" first emerged in the 1960s and referred to any system designed to streamline written communication and document production. Early word processors were not software programs but rather standalone machines.
|
||||
|
||||
- · IBM MT/ST (Magnetic Tape/Selectric Typewriter) : Introduced in 1964, this machine combined IBM's Selectric typewriter with magnetic tape storage. It allowed users to record, edit, and replay typed content-an early example of digital text storage.
|
||||
- · Wang Laboratories : In the 1970s, Wang introduced dedicated word processing machines. These devices, like the Wang 1200, featured small screens and floppy disks, making them revolutionary for their time.
|
||||
|
||||
These machines were primarily used in offices, where secretarial pools benefited from their ability to make revisions without retyping entire documents.
|
||||
|
||||
## The Rise of Personal Computers (1980s)
|
||||
|
||||
The advent of personal computers in the late 1970s and early 1980s transformed word processing from a niche tool to an essential technology for businesses and individuals alike.
|
||||
|
||||
- · WordStar (1978) : Developed for the CP/M operating system, WordStar was one of the first widely used word processing programs. It featured early examples of modern features like cut, copy, and paste.
|
||||
- · Microsoft Word (1983) : Microsoft launched Word for MS-DOS in 1983, introducing a graphical user interface (GUI) and mouse support. Over the years, Microsoft Word became the industry standard for word processing.
|
||||
|
||||
Other notable software from this era included WordPerfect, which was popular among legal professionals, and Apple's MacWrite, which leveraged the Macintosh's graphical capabilities.
|
||||
|
||||
## The Modern Era (1990s - Present)
|
||||
|
||||
By the 1990s, word processing software had become more sophisticated, with features like spell check, grammar check, templates, and collaborative tools.
|
||||
|
||||
- · Microsoft Office Suite : Microsoft continued to dominate with its Office Suite, integrating Word with other productivity tools like Excel and PowerPoint.
|
||||
- · OpenOffice and LibreOffice : Open-source alternatives emerged in the early 2000s, offering free and flexible word processing options.
|
||||
- · Google Docs (2006) : The introduction of cloud-based word processing revolutionized collaboration. Google Docs enabled real-time editing and sharing, making it a staple for teams and remote work.
|
||||
|
||||
## Future of Word Processing
|
||||
|
||||
Today, word processors are more than just tools for typing. They integrate artificial intelligence for grammar and style suggestions (e.g., Grammarly), voice-to-text features, and advanced layout options. As AI continues to advance, word processors may evolve into even more intuitive tools that predict user needs, automate repetitive tasks, and support richer multimedia integration.
|
||||
|
||||
From the clunky typewriters of the 19th century to the AI-powered cloud tools of today, the word processor has come a long way. It remains an essential tool for communication and creativity, shaping how we write and share ideas.
|
||||
|
||||
## Specialized Word Processing Tools
|
||||
|
||||
In addition to general-purpose word processors, specialized tools have emerged to cater to specific industries and needs. These tools incorporate unique features tailored to their users' workflows:
|
||||
|
||||
- · Academic and Technical Writing : Tools like LaTeX gained popularity among academics, scientists, and engineers. Unlike traditional word processors, LaTeX focuses on precise formatting, particularly for complex mathematical equations, scientific papers, and technical documents. It relies on a markup language to produce polished documents suitable for publishing.
|
||||
- · Screenwriting Software : For screenwriters, tools like Final Draft and Celtx are specialized to handle scripts for film and television. These programs automate the formatting of dialogue, scene descriptions, and other elements unique to screenwriting.
|
||||
- · Legal Document Processors : Word processors tailored for legal professionals, like WordPerfect, offered features such as redlining (early version tracking) and document comparison. Even today, many law firms rely on these tools due to their robust formatting options for contracts and legal briefs.
|
||||
|
||||
## Key Features That Changed Word Processing
|
||||
|
||||
The evolution of word processors wasn't just about hardware or software improvements-it was about the features that revolutionized how people wrote and edited. Some of these transformative features include:
|
||||
|
||||
- 1. Undo/Redo : Introduced in the 1980s, the ability to undo mistakes and redo actions made experimentation and error correction much easier.
|
||||
- 2. Spell Check and Grammar Check : By the 1990s, these became standard, allowing users to spot errors automatically.
|
||||
- 3. Templates : Pre-designed formats for documents, such as resumes, letters, and invoices, helped users save time.
|
||||
- 4. Track Changes : A game-changer for collaboration, this feature allowed multiple users to suggest edits while maintaining the original text.
|
||||
- 5. Real-Time Collaboration : Tools like Google Docs and Microsoft 365 enabled multiple users to edit the same document simultaneously, forever changing teamwork dynamics.
|
||||
|
||||
## The Cultural Impact of Word Processors
|
||||
|
||||
The word processor didn't just change workplaces-it changed culture. It democratized writing, enabling anyone with access to a computer to produce professional-quality documents. This shift had profound implications for education, business, and creative fields:
|
||||
|
||||
- · Accessibility : Writers no longer needed expensive publishing equipment or training in typesetting to create polished work. This accessibility paved the way for selfpublishing, blogging, and even fan fiction communities.
|
||||
- · Education : Word processors became a cornerstone of education, teaching students not only how to write essays but also how to use technology effectively. Features like bibliography generators and integrated research tools enhanced learning.
|
||||
- · Creative Writing : Writers gained powerful tools to organize their ideas. Programs like Scrivener allowed authors to manage large projects, from novels to screenplays, with features like chapter outlines and character notes.
|
||||
|
||||
## Word Processors in a Post-Digital Era
|
||||
|
||||
As we move further into the 21st century, the role of the word processor continues to evolve:
|
||||
|
||||
- 1. Artificial Intelligence : Modern word processors are leveraging AI to suggest content improvements. Tools like Grammarly, ProWritingAid, and even native features in Word now analyze tone, conciseness, and clarity. Some AI systems can even generate entire paragraphs or rewrite sentences.
|
||||
- 2. Integration with Other Tools : Word processors are no longer standalone. They integrate with task managers, cloud storage, and project management platforms. For instance, Google Docs syncs with Google Drive, while Microsoft Word integrates seamlessly with OneDrive and Teams.
|
||||
- 3. Voice Typing : Speech-to-text capabilities have made word processing more accessible, particularly for those with disabilities. Tools like Dragon NaturallySpeaking and built-in options in Google Docs and Microsoft Word have made dictation mainstream.
|
||||
- 4. Multimedia Documents : Word processing has expanded beyond text. Modern tools allow users to embed images, videos, charts, and interactive elements, transforming simple documents into rich multimedia experiences.
|
||||
- 5. Cross-Platform Accessibility : Thanks to cloud computing, documents can now be accessed and edited across devices. Whether you're on a desktop, tablet, or smartphone, you can continue working seamlessly.
|
||||
|
||||
## A Glimpse Into the Future
|
||||
|
||||
The word processor's future lies in adaptability and intelligence. Some exciting possibilities include:
|
||||
|
||||
- · Fully AI-Assisted Writing : Imagine a word processor that understands your writing style, drafts emails, or creates entire essays based on minimal input.
|
||||
- · Immersive Interfaces : As augmented reality (AR) and virtual reality (VR) technology advance, users may be able to write and edit in 3D spaces, collaborating in virtual environments.
|
||||
- · Hyper-Personalization : Word processors could offer dynamic suggestions based on industry-specific needs, user habits, or even regional language variations.
|
||||
|
||||
The journey of the word processor-from clunky typewriters to AI-powered platformsreflects humanity's broader technological progress. What began as a tool to simply replace handwriting has transformed into a powerful ally for creativity, communication, and collaboration. As technology continues to advance, the word processor will undoubtedly remain at the heart of how we express ideas and connect with one another.
|
21968
tests/data/groundtruth/docling_v2/multi_page.pages.json
Normal file
21968
tests/data/groundtruth/docling_v2/multi_page.pages.json
Normal file
File diff suppressed because it is too large
Load Diff
@ -334,7 +334,7 @@
|
||||
{
|
||||
"page_no": 1,
|
||||
"bbox": {
|
||||
"l": 134.9200439453125,
|
||||
"l": 134.9199981689453,
|
||||
"t": 487.109375,
|
||||
"r": 475.6635437011719,
|
||||
"b": 281.78173828125,
|
||||
@ -372,7 +372,7 @@
|
||||
{
|
||||
"page_no": 2,
|
||||
"bbox": {
|
||||
"l": 218.8155517578125,
|
||||
"l": 218.81556701660156,
|
||||
"t": 513.9846496582031,
|
||||
"r": 391.96246337890625,
|
||||
"b": 283.10589599609375,
|
||||
|
@ -1390,7 +1390,7 @@
|
||||
"id": 2,
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 134.9200439453125,
|
||||
"l": 134.9199981689453,
|
||||
"t": 304.890625,
|
||||
"r": 475.6635437011719,
|
||||
"b": 510.21826171875,
|
||||
@ -2174,7 +2174,7 @@
|
||||
"id": 2,
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 134.9200439453125,
|
||||
"l": 134.9199981689453,
|
||||
"t": 304.890625,
|
||||
"r": 475.6635437011719,
|
||||
"b": 510.21826171875,
|
||||
@ -2909,7 +2909,7 @@
|
||||
"id": 2,
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 134.9200439453125,
|
||||
"l": 134.9199981689453,
|
||||
"t": 304.890625,
|
||||
"r": 475.6635437011719,
|
||||
"b": 510.21826171875,
|
||||
@ -3623,7 +3623,7 @@
|
||||
"b": 268.20489999999995,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9870928525924683,
|
||||
"confidence": 0.987092912197113,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -3938,7 +3938,7 @@
|
||||
"b": 532.05774,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9494236707687378,
|
||||
"confidence": 0.9494234323501587,
|
||||
"cells": [
|
||||
{
|
||||
"index": 12,
|
||||
@ -4302,7 +4302,7 @@
|
||||
"id": 2,
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 218.8155517578125,
|
||||
"l": 218.81556701660156,
|
||||
"t": 278.0153503417969,
|
||||
"r": 391.96246337890625,
|
||||
"b": 508.89410400390625,
|
||||
@ -4337,7 +4337,7 @@
|
||||
"b": 268.20489999999995,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9870928525924683,
|
||||
"confidence": 0.987092912197113,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -4658,7 +4658,7 @@
|
||||
"b": 532.05774,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9494236707687378,
|
||||
"confidence": 0.9494234323501587,
|
||||
"cells": [
|
||||
{
|
||||
"index": 12,
|
||||
@ -5040,7 +5040,7 @@
|
||||
"id": 2,
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 218.8155517578125,
|
||||
"l": 218.81556701660156,
|
||||
"t": 278.0153503417969,
|
||||
"r": 391.96246337890625,
|
||||
"b": 508.89410400390625,
|
||||
@ -5072,7 +5072,7 @@
|
||||
"b": 268.20489999999995,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9870928525924683,
|
||||
"confidence": 0.987092912197113,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -5393,7 +5393,7 @@
|
||||
"b": 532.05774,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9494236707687378,
|
||||
"confidence": 0.9494234323501587,
|
||||
"cells": [
|
||||
{
|
||||
"index": 12,
|
||||
@ -5729,7 +5729,7 @@
|
||||
"id": 2,
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 218.8155517578125,
|
||||
"l": 218.81556701660156,
|
||||
"t": 278.0153503417969,
|
||||
"r": 391.96246337890625,
|
||||
"b": 508.89410400390625,
|
||||
|
@ -8589,7 +8589,7 @@
|
||||
{
|
||||
"page_no": 1,
|
||||
"bbox": {
|
||||
"l": 33.09040069580078,
|
||||
"l": 33.09052658081055,
|
||||
"t": 498.9671630859375,
|
||||
"r": 585.1502075195312,
|
||||
"b": 89.5469970703125,
|
||||
@ -8683,9 +8683,9 @@
|
||||
{
|
||||
"page_no": 3,
|
||||
"bbox": {
|
||||
"l": 64.1669921875,
|
||||
"l": 64.16704559326172,
|
||||
"t": 188.49365234375,
|
||||
"r": 258.7742919921875,
|
||||
"r": 258.77435302734375,
|
||||
"b": 103.87176513671875,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
@ -8743,7 +8743,7 @@
|
||||
{
|
||||
"page_no": 4,
|
||||
"bbox": {
|
||||
"l": 145.4144744873047,
|
||||
"l": 145.41448974609375,
|
||||
"t": 264.7552490234375,
|
||||
"r": 252.08840942382812,
|
||||
"b": 156.616943359375,
|
||||
@ -8773,10 +8773,10 @@
|
||||
{
|
||||
"page_no": 5,
|
||||
"bbox": {
|
||||
"l": 32.075252532958984,
|
||||
"t": 721.4226226806641,
|
||||
"l": 32.075260162353516,
|
||||
"t": 721.4226608276367,
|
||||
"r": 239.620361328125,
|
||||
"b": 554.0420684814453,
|
||||
"b": 554.0421142578125,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -8996,7 +8996,7 @@
|
||||
"page_no": 10,
|
||||
"bbox": {
|
||||
"l": 135.97177124023438,
|
||||
"t": 684.5892486572266,
|
||||
"t": 684.5892562866211,
|
||||
"r": 545.4180908203125,
|
||||
"b": 381.39068603515625,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
@ -9063,9 +9063,9 @@
|
||||
{
|
||||
"page_no": 11,
|
||||
"bbox": {
|
||||
"l": 135.64837646484375,
|
||||
"t": 407.8262939453125,
|
||||
"r": 301.2367248535156,
|
||||
"l": 135.64834594726562,
|
||||
"t": 407.8263244628906,
|
||||
"r": 301.23675537109375,
|
||||
"b": 197.24334716796875,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
@ -9101,10 +9101,10 @@
|
||||
{
|
||||
"page_no": 14,
|
||||
"bbox": {
|
||||
"l": 63.801902770996094,
|
||||
"t": 696.6175842285156,
|
||||
"r": 547.11474609375,
|
||||
"b": 621.9678497314453,
|
||||
"l": 63.80195617675781,
|
||||
"t": 696.6176071166992,
|
||||
"r": 547.1146850585938,
|
||||
"b": 621.9679107666016,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -9139,7 +9139,7 @@
|
||||
{
|
||||
"page_no": 14,
|
||||
"bbox": {
|
||||
"l": 63.985130310058594,
|
||||
"l": 63.9850959777832,
|
||||
"t": 364.09503173828125,
|
||||
"r": 530.0478515625,
|
||||
"b": 145.8603515625,
|
||||
@ -9178,9 +9178,9 @@
|
||||
"page_no": 15,
|
||||
"bbox": {
|
||||
"l": 136.5016632080078,
|
||||
"t": 672.7508773803711,
|
||||
"t": 672.7509078979492,
|
||||
"r": 545.4508666992188,
|
||||
"b": 314.4587707519531,
|
||||
"b": 314.45880126953125,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -9322,10 +9322,10 @@
|
||||
{
|
||||
"page_no": 2,
|
||||
"bbox": {
|
||||
"l": 136.1496124267578,
|
||||
"t": 659.9669647216797,
|
||||
"r": 547.5267944335938,
|
||||
"b": 76.34844970703125,
|
||||
"l": 136.1495819091797,
|
||||
"t": 659.9669189453125,
|
||||
"r": 547.52685546875,
|
||||
"b": 76.3485107421875,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -12490,9 +12490,9 @@
|
||||
"page_no": 8,
|
||||
"bbox": {
|
||||
"l": 135.52462768554688,
|
||||
"t": 502.2747802734375,
|
||||
"t": 502.2746887207031,
|
||||
"r": 545.8714599609375,
|
||||
"b": 349.949462890625,
|
||||
"b": 349.94940185546875,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
@ -13115,7 +13115,7 @@
|
||||
"page_no": 9,
|
||||
"bbox": {
|
||||
"l": 64.41139221191406,
|
||||
"t": 398.3863830566406,
|
||||
"t": 398.3863525390625,
|
||||
"r": 547.3950805664062,
|
||||
"b": 70.39208984375,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
@ -15731,7 +15731,7 @@
|
||||
{
|
||||
"page_no": 12,
|
||||
"bbox": {
|
||||
"l": 63.55636978149414,
|
||||
"l": 63.55635070800781,
|
||||
"t": 687.7661285400391,
|
||||
"r": 548.5687255859375,
|
||||
"b": 495.77532958984375,
|
||||
|
File diff suppressed because it is too large
Load Diff
@ -1171,7 +1171,7 @@
|
||||
"b": 295.08200000000005,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9547483325004578,
|
||||
"confidence": 0.9547481536865234,
|
||||
"cells": [
|
||||
{
|
||||
"index": 17,
|
||||
@ -1311,7 +1311,7 @@
|
||||
"b": 350.522,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9672117233276367,
|
||||
"confidence": 0.9672118425369263,
|
||||
"cells": [
|
||||
{
|
||||
"index": 22,
|
||||
@ -1971,7 +1971,7 @@
|
||||
"b": 295.08200000000005,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9547483325004578,
|
||||
"confidence": 0.9547481536865234,
|
||||
"cells": [
|
||||
{
|
||||
"index": 17,
|
||||
@ -2117,7 +2117,7 @@
|
||||
"b": 350.522,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9672117233276367,
|
||||
"confidence": 0.9672118425369263,
|
||||
"cells": [
|
||||
{
|
||||
"index": 22,
|
||||
@ -2770,7 +2770,7 @@
|
||||
"b": 295.08200000000005,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9547483325004578,
|
||||
"confidence": 0.9547481536865234,
|
||||
"cells": [
|
||||
{
|
||||
"index": 17,
|
||||
@ -2916,7 +2916,7 @@
|
||||
"b": 350.522,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9672117233276367,
|
||||
"confidence": 0.9672118425369263,
|
||||
"cells": [
|
||||
{
|
||||
"index": 22,
|
||||
|
@ -5951,7 +5951,7 @@
|
||||
"b": 465.596681609368,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9393879771232605,
|
||||
"confidence": 0.93938809633255,
|
||||
"cells": [
|
||||
{
|
||||
"index": 77,
|
||||
@ -7406,7 +7406,7 @@
|
||||
"b": 534.1167018462124,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5769620537757874,
|
||||
"confidence": 0.5769621729850769,
|
||||
"cells": [
|
||||
{
|
||||
"index": 134,
|
||||
@ -8046,7 +8046,7 @@
|
||||
"b": 650.6431884765625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6444889903068542,
|
||||
"confidence": 0.6444893479347229,
|
||||
"cells": [],
|
||||
"children": []
|
||||
}
|
||||
@ -10042,7 +10042,7 @@
|
||||
"b": 465.596681609368,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9393879771232605,
|
||||
"confidence": 0.93938809633255,
|
||||
"cells": [
|
||||
{
|
||||
"index": 77,
|
||||
@ -11509,7 +11509,7 @@
|
||||
"b": 534.1167018462124,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5769620537757874,
|
||||
"confidence": 0.5769621729850769,
|
||||
"cells": [
|
||||
{
|
||||
"index": 134,
|
||||
@ -12155,7 +12155,7 @@
|
||||
"b": 650.6431884765625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6444889903068542,
|
||||
"confidence": 0.6444893479347229,
|
||||
"cells": [],
|
||||
"children": []
|
||||
},
|
||||
@ -14148,7 +14148,7 @@
|
||||
"b": 465.596681609368,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9393879771232605,
|
||||
"confidence": 0.93938809633255,
|
||||
"cells": [
|
||||
{
|
||||
"index": 77,
|
||||
@ -15615,7 +15615,7 @@
|
||||
"b": 534.1167018462124,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5769620537757874,
|
||||
"confidence": 0.5769621729850769,
|
||||
"cells": [
|
||||
{
|
||||
"index": 134,
|
||||
@ -16261,7 +16261,7 @@
|
||||
"b": 650.6431884765625,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6444889903068542,
|
||||
"confidence": 0.6444893479347229,
|
||||
"cells": [],
|
||||
"children": []
|
||||
},
|
||||
|
@ -1102,7 +1102,7 @@
|
||||
"page_no": 1,
|
||||
"bbox": {
|
||||
"l": 388.5767822265625,
|
||||
"t": 806.0041046142578,
|
||||
"t": 806.0040969848633,
|
||||
"r": 482.4759216308594,
|
||||
"b": 739.034423828125,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
|
@ -1391,7 +1391,7 @@
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 388.5767822265625,
|
||||
"t": 36.03587341308594,
|
||||
"t": 36.03588104248047,
|
||||
"r": 482.4759216308594,
|
||||
"b": 103.00555419921875,
|
||||
"coord_origin": "TOPLEFT"
|
||||
@ -1477,7 +1477,7 @@
|
||||
"b": 81.03008981017001,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6917961239814758,
|
||||
"confidence": 0.6917959451675415,
|
||||
"cells": [
|
||||
{
|
||||
"index": 2,
|
||||
@ -1517,7 +1517,7 @@
|
||||
"b": 790.0379791491694,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.899228036403656,
|
||||
"confidence": 0.8992282152175903,
|
||||
"cells": [
|
||||
{
|
||||
"index": 3,
|
||||
@ -1597,7 +1597,7 @@
|
||||
"b": 323.44982924225053,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6362584233283997,
|
||||
"confidence": 0.6362582445144653,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -2361,7 +2361,7 @@
|
||||
"b": 179.2998695799522,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7258325815200806,
|
||||
"confidence": 0.7258322834968567,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -2891,7 +2891,7 @@
|
||||
"b": 233.17986945372706,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8121814727783203,
|
||||
"confidence": 0.8121819496154785,
|
||||
"cells": [
|
||||
{
|
||||
"index": 25,
|
||||
@ -2931,7 +2931,7 @@
|
||||
"b": 228.73998946412837,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7672220468521118,
|
||||
"confidence": 0.7672221660614014,
|
||||
"cells": [
|
||||
{
|
||||
"index": 26,
|
||||
@ -2971,7 +2971,7 @@
|
||||
"b": 255.88982940052404,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8320456743240356,
|
||||
"confidence": 0.8320454955101013,
|
||||
"cells": [
|
||||
{
|
||||
"index": 27,
|
||||
@ -3011,7 +3011,7 @@
|
||||
"b": 251.44994941092557,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5538824796676636,
|
||||
"confidence": 0.5538817644119263,
|
||||
"cells": [
|
||||
{
|
||||
"index": 28,
|
||||
@ -3051,7 +3051,7 @@
|
||||
"b": 278.5698293473914,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7909000515937805,
|
||||
"confidence": 0.7908995151519775,
|
||||
"cells": [
|
||||
{
|
||||
"index": 29,
|
||||
@ -3131,7 +3131,7 @@
|
||||
"b": 323.44982924225053,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6534578204154968,
|
||||
"confidence": 0.6534579396247864,
|
||||
"cells": [
|
||||
{
|
||||
"index": 31,
|
||||
@ -3236,7 +3236,7 @@
|
||||
"b": 296.80999930466,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5417144298553467,
|
||||
"confidence": 0.5417138934135437,
|
||||
"cells": [
|
||||
{
|
||||
"index": 35,
|
||||
@ -3318,7 +3318,7 @@
|
||||
"b": 596.0198686036978,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.719137966632843,
|
||||
"confidence": 0.7191378474235535,
|
||||
"cells": [
|
||||
{
|
||||
"index": 37,
|
||||
@ -3822,7 +3822,7 @@
|
||||
"b": 386.56997909437825,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8262879252433777,
|
||||
"confidence": 0.8262876868247986,
|
||||
"cells": [
|
||||
{
|
||||
"index": 38,
|
||||
@ -3862,7 +3862,7 @@
|
||||
"b": 413.70983903079747,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7766718864440918,
|
||||
"confidence": 0.7766715884208679,
|
||||
"cells": [
|
||||
{
|
||||
"index": 39,
|
||||
@ -3902,7 +3902,7 @@
|
||||
"b": 409.26995904119883,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8204737901687622,
|
||||
"confidence": 0.8204739093780518,
|
||||
"cells": [
|
||||
{
|
||||
"index": 40,
|
||||
@ -3942,7 +3942,7 @@
|
||||
"b": 436.3898589776647,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7670677900314331,
|
||||
"confidence": 0.7670676708221436,
|
||||
"cells": [
|
||||
{
|
||||
"index": 41,
|
||||
@ -3982,7 +3982,7 @@
|
||||
"b": 432.0699789877849,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8048340082168579,
|
||||
"confidence": 0.8048339486122131,
|
||||
"cells": [
|
||||
{
|
||||
"index": 42,
|
||||
@ -4062,7 +4062,7 @@
|
||||
"b": 454.7499689346523,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.827337384223938,
|
||||
"confidence": 0.8273372054100037,
|
||||
"cells": [
|
||||
{
|
||||
"index": 44,
|
||||
@ -4102,7 +4102,7 @@
|
||||
"b": 481.8698388711183,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7342236638069153,
|
||||
"confidence": 0.7342240214347839,
|
||||
"cells": [
|
||||
{
|
||||
"index": 45,
|
||||
@ -4142,7 +4142,7 @@
|
||||
"b": 477.42995888151955,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8411222696304321,
|
||||
"confidence": 0.8411223888397217,
|
||||
"cells": [
|
||||
{
|
||||
"index": 46,
|
||||
@ -4182,7 +4182,7 @@
|
||||
"b": 528.3098487623228,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7251589894294739,
|
||||
"confidence": 0.7251590490341187,
|
||||
"cells": [
|
||||
{
|
||||
"index": 47,
|
||||
@ -4247,7 +4247,7 @@
|
||||
"b": 501.78997882445117,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7848678827285767,
|
||||
"confidence": 0.7848676443099976,
|
||||
"cells": [
|
||||
{
|
||||
"index": 49,
|
||||
@ -4287,7 +4287,7 @@
|
||||
"b": 573.2198486571116,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7586438059806824,
|
||||
"confidence": 0.758643627166748,
|
||||
"cells": [
|
||||
{
|
||||
"index": 50,
|
||||
@ -4352,7 +4352,7 @@
|
||||
"b": 546.69997871924,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7897851467132568,
|
||||
"confidence": 0.7897858619689941,
|
||||
"cells": [
|
||||
{
|
||||
"index": 52,
|
||||
@ -4432,7 +4432,7 @@
|
||||
"b": 591.5799886140991,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8144810795783997,
|
||||
"confidence": 0.8144806027412415,
|
||||
"cells": [
|
||||
{
|
||||
"index": 54,
|
||||
@ -4484,7 +4484,7 @@
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 388.5767822265625,
|
||||
"t": 36.03587341308594,
|
||||
"t": 36.03588104248047,
|
||||
"r": 482.4759216308594,
|
||||
"b": 103.00555419921875,
|
||||
"coord_origin": "TOPLEFT"
|
||||
@ -4580,7 +4580,7 @@
|
||||
"b": 81.03008981017001,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6917961239814758,
|
||||
"confidence": 0.6917959451675415,
|
||||
"cells": [
|
||||
{
|
||||
"index": 2,
|
||||
@ -4626,7 +4626,7 @@
|
||||
"b": 790.0379791491694,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.899228036403656,
|
||||
"confidence": 0.8992282152175903,
|
||||
"cells": [
|
||||
{
|
||||
"index": 3,
|
||||
@ -4718,7 +4718,7 @@
|
||||
"b": 323.44982924225053,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6362584233283997,
|
||||
"confidence": 0.6362582445144653,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -5482,7 +5482,7 @@
|
||||
"b": 179.2998695799522,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7258325815200806,
|
||||
"confidence": 0.7258322834968567,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -6012,7 +6012,7 @@
|
||||
"b": 233.17986945372706,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8121814727783203,
|
||||
"confidence": 0.8121819496154785,
|
||||
"cells": [
|
||||
{
|
||||
"index": 25,
|
||||
@ -6052,7 +6052,7 @@
|
||||
"b": 228.73998946412837,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7672220468521118,
|
||||
"confidence": 0.7672221660614014,
|
||||
"cells": [
|
||||
{
|
||||
"index": 26,
|
||||
@ -6092,7 +6092,7 @@
|
||||
"b": 255.88982940052404,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8320456743240356,
|
||||
"confidence": 0.8320454955101013,
|
||||
"cells": [
|
||||
{
|
||||
"index": 27,
|
||||
@ -6132,7 +6132,7 @@
|
||||
"b": 251.44994941092557,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5538824796676636,
|
||||
"confidence": 0.5538817644119263,
|
||||
"cells": [
|
||||
{
|
||||
"index": 28,
|
||||
@ -6172,7 +6172,7 @@
|
||||
"b": 278.5698293473914,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7909000515937805,
|
||||
"confidence": 0.7908995151519775,
|
||||
"cells": [
|
||||
{
|
||||
"index": 29,
|
||||
@ -6252,7 +6252,7 @@
|
||||
"b": 323.44982924225053,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6534578204154968,
|
||||
"confidence": 0.6534579396247864,
|
||||
"cells": [
|
||||
{
|
||||
"index": 31,
|
||||
@ -6357,7 +6357,7 @@
|
||||
"b": 296.80999930466,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5417144298553467,
|
||||
"confidence": 0.5417138934135437,
|
||||
"cells": [
|
||||
{
|
||||
"index": 35,
|
||||
@ -6451,7 +6451,7 @@
|
||||
"b": 596.0198686036978,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.719137966632843,
|
||||
"confidence": 0.7191378474235535,
|
||||
"cells": [
|
||||
{
|
||||
"index": 37,
|
||||
@ -6955,7 +6955,7 @@
|
||||
"b": 386.56997909437825,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8262879252433777,
|
||||
"confidence": 0.8262876868247986,
|
||||
"cells": [
|
||||
{
|
||||
"index": 38,
|
||||
@ -6995,7 +6995,7 @@
|
||||
"b": 413.70983903079747,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7766718864440918,
|
||||
"confidence": 0.7766715884208679,
|
||||
"cells": [
|
||||
{
|
||||
"index": 39,
|
||||
@ -7035,7 +7035,7 @@
|
||||
"b": 409.26995904119883,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8204737901687622,
|
||||
"confidence": 0.8204739093780518,
|
||||
"cells": [
|
||||
{
|
||||
"index": 40,
|
||||
@ -7075,7 +7075,7 @@
|
||||
"b": 436.3898589776647,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7670677900314331,
|
||||
"confidence": 0.7670676708221436,
|
||||
"cells": [
|
||||
{
|
||||
"index": 41,
|
||||
@ -7115,7 +7115,7 @@
|
||||
"b": 432.0699789877849,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8048340082168579,
|
||||
"confidence": 0.8048339486122131,
|
||||
"cells": [
|
||||
{
|
||||
"index": 42,
|
||||
@ -7195,7 +7195,7 @@
|
||||
"b": 454.7499689346523,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.827337384223938,
|
||||
"confidence": 0.8273372054100037,
|
||||
"cells": [
|
||||
{
|
||||
"index": 44,
|
||||
@ -7235,7 +7235,7 @@
|
||||
"b": 481.8698388711183,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7342236638069153,
|
||||
"confidence": 0.7342240214347839,
|
||||
"cells": [
|
||||
{
|
||||
"index": 45,
|
||||
@ -7275,7 +7275,7 @@
|
||||
"b": 477.42995888151955,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8411222696304321,
|
||||
"confidence": 0.8411223888397217,
|
||||
"cells": [
|
||||
{
|
||||
"index": 46,
|
||||
@ -7315,7 +7315,7 @@
|
||||
"b": 528.3098487623228,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7251589894294739,
|
||||
"confidence": 0.7251590490341187,
|
||||
"cells": [
|
||||
{
|
||||
"index": 47,
|
||||
@ -7380,7 +7380,7 @@
|
||||
"b": 501.78997882445117,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7848678827285767,
|
||||
"confidence": 0.7848676443099976,
|
||||
"cells": [
|
||||
{
|
||||
"index": 49,
|
||||
@ -7420,7 +7420,7 @@
|
||||
"b": 573.2198486571116,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7586438059806824,
|
||||
"confidence": 0.758643627166748,
|
||||
"cells": [
|
||||
{
|
||||
"index": 50,
|
||||
@ -7485,7 +7485,7 @@
|
||||
"b": 546.69997871924,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7897851467132568,
|
||||
"confidence": 0.7897858619689941,
|
||||
"cells": [
|
||||
{
|
||||
"index": 52,
|
||||
@ -7565,7 +7565,7 @@
|
||||
"b": 591.5799886140991,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8144810795783997,
|
||||
"confidence": 0.8144806027412415,
|
||||
"cells": [
|
||||
{
|
||||
"index": 54,
|
||||
@ -7610,7 +7610,7 @@
|
||||
"label": "picture",
|
||||
"bbox": {
|
||||
"l": 388.5767822265625,
|
||||
"t": 36.03587341308594,
|
||||
"t": 36.03588104248047,
|
||||
"r": 482.4759216308594,
|
||||
"b": 103.00555419921875,
|
||||
"coord_origin": "TOPLEFT"
|
||||
@ -7706,7 +7706,7 @@
|
||||
"b": 81.03008981017001,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6917961239814758,
|
||||
"confidence": 0.6917959451675415,
|
||||
"cells": [
|
||||
{
|
||||
"index": 2,
|
||||
@ -7798,7 +7798,7 @@
|
||||
"b": 323.44982924225053,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6362584233283997,
|
||||
"confidence": 0.6362582445144653,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -8562,7 +8562,7 @@
|
||||
"b": 179.2998695799522,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7258325815200806,
|
||||
"confidence": 0.7258322834968567,
|
||||
"cells": [
|
||||
{
|
||||
"index": 5,
|
||||
@ -9092,7 +9092,7 @@
|
||||
"b": 233.17986945372706,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8121814727783203,
|
||||
"confidence": 0.8121819496154785,
|
||||
"cells": [
|
||||
{
|
||||
"index": 25,
|
||||
@ -9132,7 +9132,7 @@
|
||||
"b": 228.73998946412837,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7672220468521118,
|
||||
"confidence": 0.7672221660614014,
|
||||
"cells": [
|
||||
{
|
||||
"index": 26,
|
||||
@ -9172,7 +9172,7 @@
|
||||
"b": 255.88982940052404,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8320456743240356,
|
||||
"confidence": 0.8320454955101013,
|
||||
"cells": [
|
||||
{
|
||||
"index": 27,
|
||||
@ -9212,7 +9212,7 @@
|
||||
"b": 251.44994941092557,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5538824796676636,
|
||||
"confidence": 0.5538817644119263,
|
||||
"cells": [
|
||||
{
|
||||
"index": 28,
|
||||
@ -9252,7 +9252,7 @@
|
||||
"b": 278.5698293473914,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7909000515937805,
|
||||
"confidence": 0.7908995151519775,
|
||||
"cells": [
|
||||
{
|
||||
"index": 29,
|
||||
@ -9332,7 +9332,7 @@
|
||||
"b": 323.44982924225053,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.6534578204154968,
|
||||
"confidence": 0.6534579396247864,
|
||||
"cells": [
|
||||
{
|
||||
"index": 31,
|
||||
@ -9437,7 +9437,7 @@
|
||||
"b": 296.80999930466,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.5417144298553467,
|
||||
"confidence": 0.5417138934135437,
|
||||
"cells": [
|
||||
{
|
||||
"index": 35,
|
||||
@ -9531,7 +9531,7 @@
|
||||
"b": 596.0198686036978,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.719137966632843,
|
||||
"confidence": 0.7191378474235535,
|
||||
"cells": [
|
||||
{
|
||||
"index": 37,
|
||||
@ -10035,7 +10035,7 @@
|
||||
"b": 386.56997909437825,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8262879252433777,
|
||||
"confidence": 0.8262876868247986,
|
||||
"cells": [
|
||||
{
|
||||
"index": 38,
|
||||
@ -10075,7 +10075,7 @@
|
||||
"b": 413.70983903079747,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7766718864440918,
|
||||
"confidence": 0.7766715884208679,
|
||||
"cells": [
|
||||
{
|
||||
"index": 39,
|
||||
@ -10115,7 +10115,7 @@
|
||||
"b": 409.26995904119883,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8204737901687622,
|
||||
"confidence": 0.8204739093780518,
|
||||
"cells": [
|
||||
{
|
||||
"index": 40,
|
||||
@ -10155,7 +10155,7 @@
|
||||
"b": 436.3898589776647,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7670677900314331,
|
||||
"confidence": 0.7670676708221436,
|
||||
"cells": [
|
||||
{
|
||||
"index": 41,
|
||||
@ -10195,7 +10195,7 @@
|
||||
"b": 432.0699789877849,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8048340082168579,
|
||||
"confidence": 0.8048339486122131,
|
||||
"cells": [
|
||||
{
|
||||
"index": 42,
|
||||
@ -10275,7 +10275,7 @@
|
||||
"b": 454.7499689346523,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.827337384223938,
|
||||
"confidence": 0.8273372054100037,
|
||||
"cells": [
|
||||
{
|
||||
"index": 44,
|
||||
@ -10315,7 +10315,7 @@
|
||||
"b": 481.8698388711183,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7342236638069153,
|
||||
"confidence": 0.7342240214347839,
|
||||
"cells": [
|
||||
{
|
||||
"index": 45,
|
||||
@ -10355,7 +10355,7 @@
|
||||
"b": 477.42995888151955,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8411222696304321,
|
||||
"confidence": 0.8411223888397217,
|
||||
"cells": [
|
||||
{
|
||||
"index": 46,
|
||||
@ -10395,7 +10395,7 @@
|
||||
"b": 528.3098487623228,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7251589894294739,
|
||||
"confidence": 0.7251590490341187,
|
||||
"cells": [
|
||||
{
|
||||
"index": 47,
|
||||
@ -10460,7 +10460,7 @@
|
||||
"b": 501.78997882445117,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7848678827285767,
|
||||
"confidence": 0.7848676443099976,
|
||||
"cells": [
|
||||
{
|
||||
"index": 49,
|
||||
@ -10500,7 +10500,7 @@
|
||||
"b": 573.2198486571116,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7586438059806824,
|
||||
"confidence": 0.758643627166748,
|
||||
"cells": [
|
||||
{
|
||||
"index": 50,
|
||||
@ -10565,7 +10565,7 @@
|
||||
"b": 546.69997871924,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.7897851467132568,
|
||||
"confidence": 0.7897858619689941,
|
||||
"cells": [
|
||||
{
|
||||
"index": 52,
|
||||
@ -10645,7 +10645,7 @@
|
||||
"b": 591.5799886140991,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.8144810795783997,
|
||||
"confidence": 0.8144806027412415,
|
||||
"cells": [
|
||||
{
|
||||
"index": 54,
|
||||
@ -10695,7 +10695,7 @@
|
||||
"b": 790.0379791491694,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.899228036403656,
|
||||
"confidence": 0.8992282152175903,
|
||||
"cells": [
|
||||
{
|
||||
"index": 3,
|
||||
|
BIN
tests/data/pdf/multi_page.pdf
Normal file
BIN
tests/data/pdf/multi_page.pdf
Normal file
Binary file not shown.
@ -44,10 +44,10 @@
|
||||
"prov": [
|
||||
{
|
||||
"bbox": [
|
||||
69.0,
|
||||
688.5883585611979,
|
||||
506.6666666666667,
|
||||
767.2550252278646
|
||||
69.6796630536824,
|
||||
689.0124221922704,
|
||||
504.8720051760782,
|
||||
764.9216921155637
|
||||
],
|
||||
"page": 1,
|
||||
"span": [
|
||||
|
@ -15,20 +15,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 71.33333333333333,
|
||||
"r_y0": 99.33333333333333,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 99.33333333333333,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 74.66666666666667,
|
||||
"r_x3": 71.33333333333333,
|
||||
"r_y3": 74.66666666666667,
|
||||
"r_x0": 73.34702132031646,
|
||||
"r_y0": 97.99999977896755,
|
||||
"r_x1": 503.64955224479564,
|
||||
"r_y1": 97.99999977896755,
|
||||
"r_x2": 503.64955224479564,
|
||||
"r_y2": 76.99999977896756,
|
||||
"r_x3": 73.34702132031646,
|
||||
"r_y3": 76.99999977896756,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "Docling bundles PDF document conversion to",
|
||||
"orig": "Docling bundles PDF document conversion to",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9555703127793324,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -40,20 +40,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 69.0,
|
||||
"r_y0": 126.66666666666667,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 126.66666666666667,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 100.66666666666667,
|
||||
"r_x3": 69.0,
|
||||
"r_y3": 100.66666666666667,
|
||||
"r_x0": 69.6796630536824,
|
||||
"r_y0": 124.83139494707741,
|
||||
"r_x1": 504.8720051760782,
|
||||
"r_y1": 124.83139494707741,
|
||||
"r_x2": 504.8720051760782,
|
||||
"r_y2": 104.00000011573796,
|
||||
"r_x3": 69.6796630536824,
|
||||
"r_y3": 104.00000011573796,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "JSON and Markdown in an easy self contained",
|
||||
"orig": "JSON and Markdown in an easy self contained",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9741098171752292,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -65,20 +65,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 70.66666666666667,
|
||||
"r_y0": 153.33333333333334,
|
||||
"r_x1": 154.0,
|
||||
"r_y1": 153.33333333333334,
|
||||
"r_x2": 154.0,
|
||||
"r_y2": 128.66666666666666,
|
||||
"r_x3": 70.66666666666667,
|
||||
"r_y3": 128.66666666666666,
|
||||
"r_x0": 71.84193505100733,
|
||||
"r_y0": 152.90926970226084,
|
||||
"r_x1": 153.088934155825,
|
||||
"r_y1": 152.90926970226084,
|
||||
"r_x2": 153.088934155825,
|
||||
"r_y2": 129.797125232046,
|
||||
"r_x3": 71.84193505100733,
|
||||
"r_y3": 129.797125232046,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "package",
|
||||
"orig": "package",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.6702765056141881,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
}
|
||||
],
|
||||
@ -90,13 +90,13 @@
|
||||
"id": 0,
|
||||
"label": "text",
|
||||
"bbox": {
|
||||
"l": 69.0,
|
||||
"t": 74.66666666666667,
|
||||
"r": 506.6666666666667,
|
||||
"b": 153.33333333333334,
|
||||
"l": 69.6796630536824,
|
||||
"t": 76.99999977896756,
|
||||
"r": 504.8720051760782,
|
||||
"b": 152.90926970226084,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9715733528137207,
|
||||
"confidence": 0.9715732336044312,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -107,20 +107,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 71.33333333333333,
|
||||
"r_y0": 99.33333333333333,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 99.33333333333333,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 74.66666666666667,
|
||||
"r_x3": 71.33333333333333,
|
||||
"r_y3": 74.66666666666667,
|
||||
"r_x0": 73.34702132031646,
|
||||
"r_y0": 97.99999977896755,
|
||||
"r_x1": 503.64955224479564,
|
||||
"r_y1": 97.99999977896755,
|
||||
"r_x2": 503.64955224479564,
|
||||
"r_y2": 76.99999977896756,
|
||||
"r_x3": 73.34702132031646,
|
||||
"r_y3": 76.99999977896756,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "Docling bundles PDF document conversion to",
|
||||
"orig": "Docling bundles PDF document conversion to",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9555703127793324,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -132,20 +132,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 69.0,
|
||||
"r_y0": 126.66666666666667,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 126.66666666666667,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 100.66666666666667,
|
||||
"r_x3": 69.0,
|
||||
"r_y3": 100.66666666666667,
|
||||
"r_x0": 69.6796630536824,
|
||||
"r_y0": 124.83139494707741,
|
||||
"r_x1": 504.8720051760782,
|
||||
"r_y1": 124.83139494707741,
|
||||
"r_x2": 504.8720051760782,
|
||||
"r_y2": 104.00000011573796,
|
||||
"r_x3": 69.6796630536824,
|
||||
"r_y3": 104.00000011573796,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "JSON and Markdown in an easy self contained",
|
||||
"orig": "JSON and Markdown in an easy self contained",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9741098171752292,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -157,20 +157,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 70.66666666666667,
|
||||
"r_y0": 153.33333333333334,
|
||||
"r_x1": 154.0,
|
||||
"r_y1": 153.33333333333334,
|
||||
"r_x2": 154.0,
|
||||
"r_y2": 128.66666666666666,
|
||||
"r_x3": 70.66666666666667,
|
||||
"r_y3": 128.66666666666666,
|
||||
"r_x0": 71.84193505100733,
|
||||
"r_y0": 152.90926970226084,
|
||||
"r_x1": 153.088934155825,
|
||||
"r_y1": 152.90926970226084,
|
||||
"r_x2": 153.088934155825,
|
||||
"r_y2": 129.797125232046,
|
||||
"r_x3": 71.84193505100733,
|
||||
"r_y3": 129.797125232046,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "package",
|
||||
"orig": "package",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.6702765056141881,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
}
|
||||
],
|
||||
@ -195,13 +195,13 @@
|
||||
"id": 0,
|
||||
"label": "text",
|
||||
"bbox": {
|
||||
"l": 69.0,
|
||||
"t": 74.66666666666667,
|
||||
"r": 506.6666666666667,
|
||||
"b": 153.33333333333334,
|
||||
"l": 69.6796630536824,
|
||||
"t": 76.99999977896756,
|
||||
"r": 504.8720051760782,
|
||||
"b": 152.90926970226084,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9715733528137207,
|
||||
"confidence": 0.9715732336044312,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -212,20 +212,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 71.33333333333333,
|
||||
"r_y0": 99.33333333333333,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 99.33333333333333,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 74.66666666666667,
|
||||
"r_x3": 71.33333333333333,
|
||||
"r_y3": 74.66666666666667,
|
||||
"r_x0": 73.34702132031646,
|
||||
"r_y0": 97.99999977896755,
|
||||
"r_x1": 503.64955224479564,
|
||||
"r_y1": 97.99999977896755,
|
||||
"r_x2": 503.64955224479564,
|
||||
"r_y2": 76.99999977896756,
|
||||
"r_x3": 73.34702132031646,
|
||||
"r_y3": 76.99999977896756,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "Docling bundles PDF document conversion to",
|
||||
"orig": "Docling bundles PDF document conversion to",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9555703127793324,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -237,20 +237,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 69.0,
|
||||
"r_y0": 126.66666666666667,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 126.66666666666667,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 100.66666666666667,
|
||||
"r_x3": 69.0,
|
||||
"r_y3": 100.66666666666667,
|
||||
"r_x0": 69.6796630536824,
|
||||
"r_y0": 124.83139494707741,
|
||||
"r_x1": 504.8720051760782,
|
||||
"r_y1": 124.83139494707741,
|
||||
"r_x2": 504.8720051760782,
|
||||
"r_y2": 104.00000011573796,
|
||||
"r_x3": 69.6796630536824,
|
||||
"r_y3": 104.00000011573796,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "JSON and Markdown in an easy self contained",
|
||||
"orig": "JSON and Markdown in an easy self contained",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9741098171752292,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -262,20 +262,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 70.66666666666667,
|
||||
"r_y0": 153.33333333333334,
|
||||
"r_x1": 154.0,
|
||||
"r_y1": 153.33333333333334,
|
||||
"r_x2": 154.0,
|
||||
"r_y2": 128.66666666666666,
|
||||
"r_x3": 70.66666666666667,
|
||||
"r_y3": 128.66666666666666,
|
||||
"r_x0": 71.84193505100733,
|
||||
"r_y0": 152.90926970226084,
|
||||
"r_x1": 153.088934155825,
|
||||
"r_y1": 152.90926970226084,
|
||||
"r_x2": 153.088934155825,
|
||||
"r_y2": 129.797125232046,
|
||||
"r_x3": 71.84193505100733,
|
||||
"r_y3": 129.797125232046,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "package",
|
||||
"orig": "package",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.6702765056141881,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
}
|
||||
],
|
||||
@ -293,13 +293,13 @@
|
||||
"id": 0,
|
||||
"label": "text",
|
||||
"bbox": {
|
||||
"l": 69.0,
|
||||
"t": 74.66666666666667,
|
||||
"r": 506.6666666666667,
|
||||
"b": 153.33333333333334,
|
||||
"l": 69.6796630536824,
|
||||
"t": 76.99999977896756,
|
||||
"r": 504.8720051760782,
|
||||
"b": 152.90926970226084,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9715733528137207,
|
||||
"confidence": 0.9715732336044312,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -310,20 +310,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 71.33333333333333,
|
||||
"r_y0": 99.33333333333333,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 99.33333333333333,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 74.66666666666667,
|
||||
"r_x3": 71.33333333333333,
|
||||
"r_y3": 74.66666666666667,
|
||||
"r_x0": 73.34702132031646,
|
||||
"r_y0": 97.99999977896755,
|
||||
"r_x1": 503.64955224479564,
|
||||
"r_y1": 97.99999977896755,
|
||||
"r_x2": 503.64955224479564,
|
||||
"r_y2": 76.99999977896756,
|
||||
"r_x3": 73.34702132031646,
|
||||
"r_y3": 76.99999977896756,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "Docling bundles PDF document conversion to",
|
||||
"orig": "Docling bundles PDF document conversion to",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9555703127793324,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -335,20 +335,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 69.0,
|
||||
"r_y0": 126.66666666666667,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 126.66666666666667,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 100.66666666666667,
|
||||
"r_x3": 69.0,
|
||||
"r_y3": 100.66666666666667,
|
||||
"r_x0": 69.6796630536824,
|
||||
"r_y0": 124.83139494707741,
|
||||
"r_x1": 504.8720051760782,
|
||||
"r_y1": 124.83139494707741,
|
||||
"r_x2": 504.8720051760782,
|
||||
"r_y2": 104.00000011573796,
|
||||
"r_x3": 69.6796630536824,
|
||||
"r_y3": 104.00000011573796,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "JSON and Markdown in an easy self contained",
|
||||
"orig": "JSON and Markdown in an easy self contained",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9741098171752292,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -360,20 +360,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 70.66666666666667,
|
||||
"r_y0": 153.33333333333334,
|
||||
"r_x1": 154.0,
|
||||
"r_y1": 153.33333333333334,
|
||||
"r_x2": 154.0,
|
||||
"r_y2": 128.66666666666666,
|
||||
"r_x3": 70.66666666666667,
|
||||
"r_y3": 128.66666666666666,
|
||||
"r_x0": 71.84193505100733,
|
||||
"r_y0": 152.90926970226084,
|
||||
"r_x1": 153.088934155825,
|
||||
"r_y1": 152.90926970226084,
|
||||
"r_x2": 153.088934155825,
|
||||
"r_y2": 129.797125232046,
|
||||
"r_x3": 71.84193505100733,
|
||||
"r_y3": 129.797125232046,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "package",
|
||||
"orig": "package",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.6702765056141881,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
}
|
||||
],
|
||||
|
@ -1,2 +1,2 @@
|
||||
<doctag><text><loc_58><loc_44><loc_426><loc_91>Docling bundles PDF document conversion to JSON and Markdown in an easy self contained package</text>
|
||||
<doctag><text><loc_59><loc_46><loc_424><loc_91>Docling bundles PDF document conversion to JSON and Markdown in an easy self contained package</text>
|
||||
</doctag>
|
@ -42,10 +42,10 @@
|
||||
{
|
||||
"page_no": 1,
|
||||
"bbox": {
|
||||
"l": 69.0,
|
||||
"t": 767.2550252278646,
|
||||
"r": 506.6666666666667,
|
||||
"b": 688.5883585611979,
|
||||
"l": 69.6796630536824,
|
||||
"t": 764.9216921155637,
|
||||
"r": 504.8720051760782,
|
||||
"b": 689.0124221922704,
|
||||
"coord_origin": "BOTTOMLEFT"
|
||||
},
|
||||
"charspan": [
|
||||
|
@ -15,20 +15,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 71.33333333333333,
|
||||
"r_y0": 99.33333333333333,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 99.33333333333333,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 74.66666666666667,
|
||||
"r_x3": 71.33333333333333,
|
||||
"r_y3": 74.66666666666667,
|
||||
"r_x0": 73.34702132031646,
|
||||
"r_y0": 97.99999977896755,
|
||||
"r_x1": 503.64955224479564,
|
||||
"r_y1": 97.99999977896755,
|
||||
"r_x2": 503.64955224479564,
|
||||
"r_y2": 76.99999977896756,
|
||||
"r_x3": 73.34702132031646,
|
||||
"r_y3": 76.99999977896756,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "Docling bundles PDF document conversion to",
|
||||
"orig": "Docling bundles PDF document conversion to",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9555703127793324,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -40,20 +40,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 69.0,
|
||||
"r_y0": 126.66666666666667,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 126.66666666666667,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 100.66666666666667,
|
||||
"r_x3": 69.0,
|
||||
"r_y3": 100.66666666666667,
|
||||
"r_x0": 69.6796630536824,
|
||||
"r_y0": 124.83139494707741,
|
||||
"r_x1": 504.8720051760782,
|
||||
"r_y1": 124.83139494707741,
|
||||
"r_x2": 504.8720051760782,
|
||||
"r_y2": 104.00000011573796,
|
||||
"r_x3": 69.6796630536824,
|
||||
"r_y3": 104.00000011573796,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "JSON and Markdown in an easy self contained",
|
||||
"orig": "JSON and Markdown in an easy self contained",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9741098171752292,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -65,20 +65,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 70.66666666666667,
|
||||
"r_y0": 153.33333333333334,
|
||||
"r_x1": 154.0,
|
||||
"r_y1": 153.33333333333334,
|
||||
"r_x2": 154.0,
|
||||
"r_y2": 128.66666666666666,
|
||||
"r_x3": 70.66666666666667,
|
||||
"r_y3": 128.66666666666666,
|
||||
"r_x0": 71.84193505100733,
|
||||
"r_y0": 152.90926970226084,
|
||||
"r_x1": 153.088934155825,
|
||||
"r_y1": 152.90926970226084,
|
||||
"r_x2": 153.088934155825,
|
||||
"r_y2": 129.797125232046,
|
||||
"r_x3": 71.84193505100733,
|
||||
"r_y3": 129.797125232046,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "package",
|
||||
"orig": "package",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.6702765056141881,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
}
|
||||
],
|
||||
@ -90,13 +90,13 @@
|
||||
"id": 0,
|
||||
"label": "text",
|
||||
"bbox": {
|
||||
"l": 69.0,
|
||||
"t": 74.66666666666667,
|
||||
"r": 506.6666666666667,
|
||||
"b": 153.33333333333334,
|
||||
"l": 69.6796630536824,
|
||||
"t": 76.99999977896756,
|
||||
"r": 504.8720051760782,
|
||||
"b": 152.90926970226084,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9715733528137207,
|
||||
"confidence": 0.9715732336044312,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -107,20 +107,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 71.33333333333333,
|
||||
"r_y0": 99.33333333333333,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 99.33333333333333,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 74.66666666666667,
|
||||
"r_x3": 71.33333333333333,
|
||||
"r_y3": 74.66666666666667,
|
||||
"r_x0": 73.34702132031646,
|
||||
"r_y0": 97.99999977896755,
|
||||
"r_x1": 503.64955224479564,
|
||||
"r_y1": 97.99999977896755,
|
||||
"r_x2": 503.64955224479564,
|
||||
"r_y2": 76.99999977896756,
|
||||
"r_x3": 73.34702132031646,
|
||||
"r_y3": 76.99999977896756,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "Docling bundles PDF document conversion to",
|
||||
"orig": "Docling bundles PDF document conversion to",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9555703127793324,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -132,20 +132,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 69.0,
|
||||
"r_y0": 126.66666666666667,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 126.66666666666667,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 100.66666666666667,
|
||||
"r_x3": 69.0,
|
||||
"r_y3": 100.66666666666667,
|
||||
"r_x0": 69.6796630536824,
|
||||
"r_y0": 124.83139494707741,
|
||||
"r_x1": 504.8720051760782,
|
||||
"r_y1": 124.83139494707741,
|
||||
"r_x2": 504.8720051760782,
|
||||
"r_y2": 104.00000011573796,
|
||||
"r_x3": 69.6796630536824,
|
||||
"r_y3": 104.00000011573796,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "JSON and Markdown in an easy self contained",
|
||||
"orig": "JSON and Markdown in an easy self contained",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9741098171752292,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -157,20 +157,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 70.66666666666667,
|
||||
"r_y0": 153.33333333333334,
|
||||
"r_x1": 154.0,
|
||||
"r_y1": 153.33333333333334,
|
||||
"r_x2": 154.0,
|
||||
"r_y2": 128.66666666666666,
|
||||
"r_x3": 70.66666666666667,
|
||||
"r_y3": 128.66666666666666,
|
||||
"r_x0": 71.84193505100733,
|
||||
"r_y0": 152.90926970226084,
|
||||
"r_x1": 153.088934155825,
|
||||
"r_y1": 152.90926970226084,
|
||||
"r_x2": 153.088934155825,
|
||||
"r_y2": 129.797125232046,
|
||||
"r_x3": 71.84193505100733,
|
||||
"r_y3": 129.797125232046,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "package",
|
||||
"orig": "package",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.6702765056141881,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
}
|
||||
],
|
||||
@ -195,13 +195,13 @@
|
||||
"id": 0,
|
||||
"label": "text",
|
||||
"bbox": {
|
||||
"l": 69.0,
|
||||
"t": 74.66666666666667,
|
||||
"r": 506.6666666666667,
|
||||
"b": 153.33333333333334,
|
||||
"l": 69.6796630536824,
|
||||
"t": 76.99999977896756,
|
||||
"r": 504.8720051760782,
|
||||
"b": 152.90926970226084,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9715733528137207,
|
||||
"confidence": 0.9715732336044312,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -212,20 +212,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 71.33333333333333,
|
||||
"r_y0": 99.33333333333333,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 99.33333333333333,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 74.66666666666667,
|
||||
"r_x3": 71.33333333333333,
|
||||
"r_y3": 74.66666666666667,
|
||||
"r_x0": 73.34702132031646,
|
||||
"r_y0": 97.99999977896755,
|
||||
"r_x1": 503.64955224479564,
|
||||
"r_y1": 97.99999977896755,
|
||||
"r_x2": 503.64955224479564,
|
||||
"r_y2": 76.99999977896756,
|
||||
"r_x3": 73.34702132031646,
|
||||
"r_y3": 76.99999977896756,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "Docling bundles PDF document conversion to",
|
||||
"orig": "Docling bundles PDF document conversion to",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9555703127793324,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -237,20 +237,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 69.0,
|
||||
"r_y0": 126.66666666666667,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 126.66666666666667,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 100.66666666666667,
|
||||
"r_x3": 69.0,
|
||||
"r_y3": 100.66666666666667,
|
||||
"r_x0": 69.6796630536824,
|
||||
"r_y0": 124.83139494707741,
|
||||
"r_x1": 504.8720051760782,
|
||||
"r_y1": 124.83139494707741,
|
||||
"r_x2": 504.8720051760782,
|
||||
"r_y2": 104.00000011573796,
|
||||
"r_x3": 69.6796630536824,
|
||||
"r_y3": 104.00000011573796,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "JSON and Markdown in an easy self contained",
|
||||
"orig": "JSON and Markdown in an easy self contained",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9741098171752292,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -262,20 +262,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 70.66666666666667,
|
||||
"r_y0": 153.33333333333334,
|
||||
"r_x1": 154.0,
|
||||
"r_y1": 153.33333333333334,
|
||||
"r_x2": 154.0,
|
||||
"r_y2": 128.66666666666666,
|
||||
"r_x3": 70.66666666666667,
|
||||
"r_y3": 128.66666666666666,
|
||||
"r_x0": 71.84193505100733,
|
||||
"r_y0": 152.90926970226084,
|
||||
"r_x1": 153.088934155825,
|
||||
"r_y1": 152.90926970226084,
|
||||
"r_x2": 153.088934155825,
|
||||
"r_y2": 129.797125232046,
|
||||
"r_x3": 71.84193505100733,
|
||||
"r_y3": 129.797125232046,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "package",
|
||||
"orig": "package",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.6702765056141881,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
}
|
||||
],
|
||||
@ -293,13 +293,13 @@
|
||||
"id": 0,
|
||||
"label": "text",
|
||||
"bbox": {
|
||||
"l": 69.0,
|
||||
"t": 74.66666666666667,
|
||||
"r": 506.6666666666667,
|
||||
"b": 153.33333333333334,
|
||||
"l": 69.6796630536824,
|
||||
"t": 76.99999977896756,
|
||||
"r": 504.8720051760782,
|
||||
"b": 152.90926970226084,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"confidence": 0.9715733528137207,
|
||||
"confidence": 0.9715732336044312,
|
||||
"cells": [
|
||||
{
|
||||
"index": 0,
|
||||
@ -310,20 +310,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 71.33333333333333,
|
||||
"r_y0": 99.33333333333333,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 99.33333333333333,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 74.66666666666667,
|
||||
"r_x3": 71.33333333333333,
|
||||
"r_y3": 74.66666666666667,
|
||||
"r_x0": 73.34702132031646,
|
||||
"r_y0": 97.99999977896755,
|
||||
"r_x1": 503.64955224479564,
|
||||
"r_y1": 97.99999977896755,
|
||||
"r_x2": 503.64955224479564,
|
||||
"r_y2": 76.99999977896756,
|
||||
"r_x3": 73.34702132031646,
|
||||
"r_y3": 76.99999977896756,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "Docling bundles PDF document conversion to",
|
||||
"orig": "Docling bundles PDF document conversion to",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9555703127793324,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -335,20 +335,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 69.0,
|
||||
"r_y0": 126.66666666666667,
|
||||
"r_x1": 506.6666666666667,
|
||||
"r_y1": 126.66666666666667,
|
||||
"r_x2": 506.6666666666667,
|
||||
"r_y2": 100.66666666666667,
|
||||
"r_x3": 69.0,
|
||||
"r_y3": 100.66666666666667,
|
||||
"r_x0": 69.6796630536824,
|
||||
"r_y0": 124.83139494707741,
|
||||
"r_x1": 504.8720051760782,
|
||||
"r_y1": 124.83139494707741,
|
||||
"r_x2": 504.8720051760782,
|
||||
"r_y2": 104.00000011573796,
|
||||
"r_x3": 69.6796630536824,
|
||||
"r_y3": 104.00000011573796,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "JSON and Markdown in an easy self contained",
|
||||
"orig": "JSON and Markdown in an easy self contained",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.9741098171752292,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
},
|
||||
{
|
||||
@ -360,20 +360,20 @@
|
||||
"a": 255
|
||||
},
|
||||
"rect": {
|
||||
"r_x0": 70.66666666666667,
|
||||
"r_y0": 153.33333333333334,
|
||||
"r_x1": 154.0,
|
||||
"r_y1": 153.33333333333334,
|
||||
"r_x2": 154.0,
|
||||
"r_y2": 128.66666666666666,
|
||||
"r_x3": 70.66666666666667,
|
||||
"r_y3": 128.66666666666666,
|
||||
"r_x0": 71.84193505100733,
|
||||
"r_y0": 152.90926970226084,
|
||||
"r_x1": 153.088934155825,
|
||||
"r_y1": 152.90926970226084,
|
||||
"r_x2": 153.088934155825,
|
||||
"r_y2": 129.797125232046,
|
||||
"r_x3": 71.84193505100733,
|
||||
"r_y3": 129.797125232046,
|
||||
"coord_origin": "TOPLEFT"
|
||||
},
|
||||
"text": "package",
|
||||
"orig": "package",
|
||||
"text_direction": "left_to_right",
|
||||
"confidence": 0.6702765056141881,
|
||||
"confidence": 1.0,
|
||||
"from_ocr": true
|
||||
}
|
||||
],
|
||||
|
@ -75,3 +75,16 @@ def test_crop_page_image(test_doc_path):
|
||||
def test_num_pages(test_doc_path):
    """Check that the backend reports the expected number of pages for the test document."""
    doc_backend = _get_backend(test_doc_path)
    # A bare `==` expression is evaluated and discarded, so the test could
    # never fail; the comparison has to be asserted to actually check anything.
    assert doc_backend.page_count() == 9
|
||||
|
||||
|
||||
def test_merge_row():
    """Check the text of the first text cell on the page loaded with index 4 of multi_page.pdf."""
    expected_text = "The journey of the word processor—from clunky typewriters to AI-powered platforms—"

    backend = _get_backend(Path("./tests/data/pdf/multi_page.pdf"))
    page_backend: PyPdfiumPageBackend = backend.load_page(4)
    first_cell = page_backend.get_text_cells()[0]

    # Compare the whole string so any duplicated or missing characters are caught.
    assert first_cell.text == expected_text
|
||||
|
Loading…
Reference in New Issue
Block a user