Use billiard (Celery's multiprocessing fork) if available

Closes #9
ocrmypdf · Aug 30, 2024 · a9916e5 · a9916e5
1 parent f3d5f7a
commit a9916e5
Showing 1 changed file with 10 additions and 5 deletions.
diff --git a/ocrmypdf_easyocr/__init__.py b/ocrmypdf_easyocr/__init__.py
@@ -5,11 +5,10 @@
 
 from __future__ import annotations
 
+import contextlib
 import logging
-import multiprocessing.managers
 import os
 import sys
-import contextlib
 import threading
 import traceback
 from pathlib import Path
@@ -27,6 +26,12 @@
 from ocrmypdf_easyocr._easyocr import tidy_easyocr_result
 from ocrmypdf_easyocr._pdf import easyocr_to_pikepdf
 
+try:
+    # Prefer billiard, Celery's fork of multiprocessing, when it is installed
+    import billiard as multiprocessing
+except ImportError:
+    import multiprocessing.managers
+
 log = logging.getLogger(__name__)
 
 ISO_639_3_2: dict[str, str] = {
@@ -113,12 +118,12 @@ def _ocr_process(q: multiprocessing.Queue[Task], options):
             if reader is None:
                 use_gpu = options.gpu
                 languages = [ISO_639_3_2[lang] for lang in options.languages]
-                
+
                 # Redirect stdout to stderr during Reader initialization to be compliant with ocrmypdf
-                # otherwise piping a pdf output to stdout gets interfered with the progress bar of loading the model to ram 
+                # otherwise the progress bar shown while the model loads into RAM interferes with PDF output piped to stdout
                 with contextlib.redirect_stdout(sys.stderr):
                     reader = easyocr.Reader(languages, use_gpu)
-                    
+
             output_dict["output"] = reader.readtext(
                 gray, batch_size=options.easyocr_batch_size
             )