feat: Add pipeline timings and toggle visualization, establish debug settings (#183)

* Add settings to turn visualization on or off Signed-off-by: Christoph Auer <cau@zurich.ibm.com> * Add profiling code to all models Signed-off-by: Christoph Auer <cau@zurich.ibm.com> * Refactor and fix profiling codes Signed-off-by: Christoph Auer <cau@zurich.ibm.com> * Visualization codes output PNG to debug dir Signed-off-by: Christoph Auer <cau@zurich.ibm.com> * Fixes for time logging Signed-off-by: Christoph Auer <cau@zurich.ibm.com> * Optimize imports Signed-off-by: Christoph Auer <cau@zurich.ibm.com> * Update lockfile Signed-off-by: Christoph Auer <cau@zurich.ibm.com> * Add start_timestamps to ProfilingItem Signed-off-by: Christoph Auer <cau@zurich.ibm.com> --------- Signed-off-by: Christoph Auer <cau@zurich.ibm.com>
2024-10-30 15:04:19 +01:00
parent 94a5290789
commit 2a2c65bf4f
23 changed files with 998 additions and 771 deletions
@@ -12,8 +12,10 @@ from docling.datamodel.base_models import (
    Table,
    TextElement,
 )
+from docling.datamodel.document import ConversionResult
 from docling.models.base_model import BasePageModel
 from docling.models.layout_model import LayoutModel
+from docling.utils.profiling import TimeRecorder

 _log = logging.getLogger(__name__)

@@ -51,122 +53,122 @@ class PageAssembleModel(BasePageModel):

        return sanitized_text.strip()  # Strip any leading or trailing whitespace

-    def __call__(self, page_batch: Iterable[Page]) -> Iterable[Page]:
+    def __call__(
+        self, conv_res: ConversionResult, page_batch: Iterable[Page]
+    ) -> Iterable[Page]:
        for page in page_batch:
            assert page._backend is not None
            if not page._backend.is_valid():
                yield page
            else:
-                assert page.predictions.layout is not None
+                with TimeRecorder(conv_res, "page_assemble"):

-                # assembles some JSON output page by page.
+                    assert page.predictions.layout is not None

-                elements: List[PageElement] = []
-                headers: List[PageElement] = []
-                body: List[PageElement] = []
+                    # assembles some JSON output page by page.

-                for cluster in page.predictions.layout.clusters:
-                    # _log.info("Cluster label seen:", cluster.label)
-                    if cluster.label in LayoutModel.TEXT_ELEM_LABELS:
+                    elements: List[PageElement] = []
+                    headers: List[PageElement] = []
+                    body: List[PageElement] = []

-                        textlines = [
-                            cell.text.replace("\x02", "-").strip()
-                            for cell in cluster.cells
-                            if len(cell.text.strip()) > 0
-                        ]
-                        text = self.sanitize_text(textlines)
-                        text_el = TextElement(
-                            label=cluster.label,
-                            id=cluster.id,
-                            text=text,
-                            page_no=page.page_no,
-                            cluster=cluster,
-                        )
-                        elements.append(text_el)
+                    for cluster in page.predictions.layout.clusters:
+                        # _log.info("Cluster label seen:", cluster.label)
+                        if cluster.label in LayoutModel.TEXT_ELEM_LABELS:

-                        if cluster.label in LayoutModel.PAGE_HEADER_LABELS:
-                            headers.append(text_el)
-                        else:
-                            body.append(text_el)
-                    elif cluster.label == LayoutModel.TABLE_LABEL:
-                        tbl = None
-                        if page.predictions.tablestructure:
-                            tbl = page.predictions.tablestructure.table_map.get(
-                                cluster.id, None
-                            )
-                        if (
-                            not tbl
-                        ):  # fallback: add table without structure, if it isn't present
-                            tbl = Table(
+                            textlines = [
+                                cell.text.replace("\x02", "-").strip()
+                                for cell in cluster.cells
+                                if len(cell.text.strip()) > 0
+                            ]
+                            text = self.sanitize_text(textlines)
+                            text_el = TextElement(
                                label=cluster.label,
                                id=cluster.id,
-                                text="",
-                                otsl_seq=[],
-                                table_cells=[],
-                                cluster=cluster,
-                                page_no=page.page_no,
-                            )
-
-                        elements.append(tbl)
-                        body.append(tbl)
-                    elif cluster.label == LayoutModel.FIGURE_LABEL:
-                        fig = None
-                        if page.predictions.figures_classification:
-                            fig = (
-                                page.predictions.figures_classification.figure_map.get(
-                                    cluster.id, None
-                                )
-                            )
-                        if (
-                            not fig
-                        ):  # fallback: add figure without classification, if it isn't present
-                            fig = FigureElement(
-                                label=cluster.label,
-                                id=cluster.id,
-                                text="",
-                                data=None,
-                                cluster=cluster,
-                                page_no=page.page_no,
-                            )
-                        elements.append(fig)
-                        body.append(fig)
-                    elif cluster.label == LayoutModel.FORMULA_LABEL:
-                        equation = None
-                        if page.predictions.equations_prediction:
-                            equation = (
-                                page.predictions.equations_prediction.equation_map.get(
-                                    cluster.id, None
-                                )
-                            )
-                        if (
-                            not equation
-                        ):  # fallback: add empty formula, if it isn't present
-                            text = self.sanitize_text(
-                                [
-                                    cell.text.replace("\x02", "-").strip()
-                                    for cell in cluster.cells
-                                    if len(cell.text.strip()) > 0
-                                ]
-                            )
-                            equation = TextElement(
-                                label=cluster.label,
-                                id=cluster.id,
-                                cluster=cluster,
-                                page_no=page.page_no,
                                text=text,
+                                page_no=page.page_no,
+                                cluster=cluster,
                            )
-                        elements.append(equation)
-                        body.append(equation)
+                            elements.append(text_el)

-                page.assembled = AssembledUnit(
-                    elements=elements, headers=headers, body=body
-                )
+                            if cluster.label in LayoutModel.PAGE_HEADER_LABELS:
+                                headers.append(text_el)
+                            else:
+                                body.append(text_el)
+                        elif cluster.label == LayoutModel.TABLE_LABEL:
+                            tbl = None
+                            if page.predictions.tablestructure:
+                                tbl = page.predictions.tablestructure.table_map.get(
+                                    cluster.id, None
+                                )
+                            if (
+                                not tbl
+                            ):  # fallback: add table without structure, if it isn't present
+                                tbl = Table(
+                                    label=cluster.label,
+                                    id=cluster.id,
+                                    text="",
+                                    otsl_seq=[],
+                                    table_cells=[],
+                                    cluster=cluster,
+                                    page_no=page.page_no,
+                                )

-                # Remove page images (can be disabled)
-                if not self.options.keep_images:
-                    page._image_cache = {}
+                            elements.append(tbl)
+                            body.append(tbl)
+                        elif cluster.label == LayoutModel.FIGURE_LABEL:
+                            fig = None
+                            if page.predictions.figures_classification:
+                                fig = page.predictions.figures_classification.figure_map.get(
+                                    cluster.id, None
+                                )
+                            if (
+                                not fig
+                            ):  # fallback: add figure without classification, if it isn't present
+                                fig = FigureElement(
+                                    label=cluster.label,
+                                    id=cluster.id,
+                                    text="",
+                                    data=None,
+                                    cluster=cluster,
+                                    page_no=page.page_no,
+                                )
+                            elements.append(fig)
+                            body.append(fig)
+                        elif cluster.label == LayoutModel.FORMULA_LABEL:
+                            equation = None
+                            if page.predictions.equations_prediction:
+                                equation = page.predictions.equations_prediction.equation_map.get(
+                                    cluster.id, None
+                                )
+                            if (
+                                not equation
+                            ):  # fallback: add empty formula, if it isn't present
+                                text = self.sanitize_text(
+                                    [
+                                        cell.text.replace("\x02", "-").strip()
+                                        for cell in cluster.cells
+                                        if len(cell.text.strip()) > 0
+                                    ]
+                                )
+                                equation = TextElement(
+                                    label=cluster.label,
+                                    id=cluster.id,
+                                    cluster=cluster,
+                                    page_no=page.page_no,
+                                    text=text,
+                                )
+                            elements.append(equation)
+                            body.append(equation)

-                # Unload backend
-                page._backend.unload()
+                    page.assembled = AssembledUnit(
+                        elements=elements, headers=headers, body=body
+                    )
+
+                    # Remove page images (can be disabled)
+                    if not self.options.keep_images:
+                        page._image_cache = {}
+
+                    # Unload backend
+                    page._backend.unload()

                yield page