From 8b35c9fddba1cd7695a33ce4d9aa5e2d9dd312b2 Mon Sep 17 00:00:00 2001 From: Michael Date: Mon, 22 Jan 2024 18:01:51 +0000 Subject: [PATCH] Tesseract: Improved detection --- tesseract/tesseract.php | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/tesseract/tesseract.php b/tesseract/tesseract.php index 3c61273f..b3e1feb6 100644 --- a/tesseract/tesseract.php +++ b/tesseract/tesseract.php @@ -24,6 +24,10 @@ function tesseract_ocr_detection(&$media) { $ocr = new TesseractOCR(); try { + $languages = $ocr->availableLanguages(); + if ($languages) { + $ocr->lang(implode('+', $languages)); + } $ocr->tempDir(System::getTempPath()); $ocr->imageData($media['img_str'], strlen($media['img_str'])); $media['description'] = $ocr->run();