fix: [ocr] fix ocr supported languages

2024-04-26 10:49:24 +02:00 · 2024-04-26 10:49:24 +02:00 · 5503d8134a
parent 1d1671c00f
commit 5503d8134a
1 changed files with 3 additions and 4 deletions
--- a/bin/modules/OcrExtractor.py
+++ b/bin/modules/OcrExtractor.py
@ -24,7 +24,7 @@ from lib.objects import Ocrs


 # Default to eng
-def get_model_languages(obj, ocr_languages, add_en=True):
+def get_model_languages(obj, add_en=True):
    if add_en:
        model_languages = {'en'}
    else:
@ -54,8 +54,6 @@ def get_model_languages(obj, ocr_languages, add_en=True):
            model_languages.add(lang)
            return model_languages

-    model_languages = Ocrs.sanityze_ocr_languages(model_languages, ocr_languages=ocr_languages)
-
    return model_languages

    #  TODO thread
@ -100,7 +98,8 @@ class OcrExtractor(AbstractModule):

        if not ocr.exists():
            path = image.get_filepath()
-            languages = get_model_languages(image, self.ocr_languages)
+            languages = get_model_languages(image)
+            languages = Ocrs.sanityze_ocr_languages(languages, ocr_languages=self.ocr_languages)
            print(image.id, languages)
            texts = Ocrs.extract_text(path, languages)
            if texts: