From 4dec21fa7796dfa8206d26d1000c28e24ebfbb57 Mon Sep 17 00:00:00 2001 From: Christoph Auer Date: Wed, 1 Feb 2023 10:36:10 +0100 Subject: [PATCH] Add option to control OCR behaviour with page images Signed-off-by: Christoph Auer --- deepsearch/documents/core/models.py | 1 + 1 file changed, 1 insertion(+) diff --git a/deepsearch/documents/core/models.py b/deepsearch/documents/core/models.py index defc7edb..bce06b14 100644 --- a/deepsearch/documents/core/models.py +++ b/deepsearch/documents/core/models.py @@ -254,6 +254,7 @@ class OCRSettings(BaseModel): backend: str = "tesseract-ocr" # validate with available options on CCS API config: dict = {} # implementation specific to OCR backend merge_mode: Optional[OCRModeEnum] = OCRModeEnum.prioritize_ocr + use_individual_bitmaps: bool = True @classmethod def get_backends(