pdf: OCR function was broken under Python 3 in some cases (depending on how the OCR language was specified)

2019-06-13 08:33:55 +02:00 · 2019-06-13 08:33:55 +02:00 · 9dcdb6e9a6
commit 9dcdb6e9a6
parent 4c205e44e0
1 changed files with 1 additions and 1 deletions
--- a/src/filters/rclpdf.py
+++ b/src/filters/rclpdf.py
@ -243,7 +243,7 @@ class PDFExtractor:
        tesseractlang = os.environ.get("RECOLL_TESSERACT_LANG", "");
        if tesseractlang:
            return tesseractlang
-        pdflangfile = os.path.join(self.confdir, b"ocrpdf")
+        pdflangfile = os.path.join(self.confdir, "ocrpdf")
        if os.path.isfile(pdflangfile):
            tesseractlang = open(pdflangfile, "r").read().strip()
        if tesseractlang: