From 9dcdb6e9a692c8855173df543168867edc82a0b8 Mon Sep 17 00:00:00 2001
From: Jean-Francois Dockes
Date: Thu, 13 Jun 2019 08:33:55 +0200
Subject: [PATCH] pdf: ocr function was broken for python3 in some cases (depending on how the ocr language was specified)

---
 src/filters/rclpdf.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/filters/rclpdf.py b/src/filters/rclpdf.py
index 616cacfa..69a7b1fe 100755
--- a/src/filters/rclpdf.py
+++ b/src/filters/rclpdf.py
@@ -243,7 +243,7 @@ class PDFExtractor:
         tesseractlang = os.environ.get("RECOLL_TESSERACT_LANG", "");
         if tesseractlang:
             return tesseractlang
-        pdflangfile = os.path.join(self.confdir, b"ocrpdf")
+        pdflangfile = os.path.join(self.confdir, "ocrpdf")
         if os.path.isfile(pdflangfile):
             tesseractlang = open(pdflangfile, "r").read().strip()
         if tesseractlang: