diff --git a/docling/models/easyocr_model.py b/docling/models/easyocr_model.py index 6c72be5..1b8e914 100644 --- a/docling/models/easyocr_model.py +++ b/docling/models/easyocr_model.py @@ -31,12 +31,9 @@ class EasyOcrModel(BaseOcrModel): "Alternatively, Docling has support for other OCR engines. See the documentation." ) - use_gpu = ( - False if torch.backends.mps.is_available() else self.options.use_gpu - ) self.reader = easyocr.Reader( lang_list=self.options.lang, - gpu=use_gpu, + gpu=self.options.use_gpu, model_storage_directory=self.options.model_storage_directory, download_enabled=self.options.download_enabled, ) diff --git a/docs/examples/custom_convert.py b/docs/examples/custom_convert.py index 204ae59..7631848 100644 --- a/docs/examples/custom_convert.py +++ b/docs/examples/custom_convert.py @@ -80,6 +80,20 @@ def main(): } ) + # Docling Parse with EasyOCR (CPU only) + # ---------------------- + # pipeline_options = PdfPipelineOptions() + # pipeline_options.do_ocr = True + # pipeline_options.ocr_options.use_gpu = False # <-- set this. + # pipeline_options.do_table_structure = True + # pipeline_options.table_structure_options.do_cell_matching = True + + # doc_converter = DocumentConverter( + # format_options={ + # InputFormat.PDF: PdfFormatOption(pipeline_options=pipeline_options) + # } + # ) + # Docling Parse with Tesseract # ---------------------- # pipeline_options = PdfPipelineOptions()