recoll/tests/config/recoll.conf.in
Jean-Francois Dockes 728129e5ce Text splitter: move apos and dash character conversions to unac_except_trans.
This was complicated and caused problems with highlight areas position computations in
plaintorich. Also, simplify the code for processing some dangling characters.
2021-11-02 14:32:38 +01:00

83 lines
1.9 KiB
Plaintext
Raw Permalink Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

# Template for the recoll.conf used when running the tests.
# The actual recoll.conf is created from this file by the top-level
# runtest.sh, not by the configure script.
# NOTE(review): the @RECOLL_...@ placeholders are presumably substituted by
# runtest.sh when it generates the real file -- confirm.
cachedir = @RECOLL_TESTCACHEDIR@
# Log levels and log file names. All log files are written under /tmp.
# NOTE(review): the daem* variants presumably apply to the monitoring
# daemon -- confirm against the Recoll manual.
loglevel = 6
logfilename = /tmp/logrcltst
idxlogfilename = /tmp/idxlogrcltst
daemloglevel = 6
daemlogfilename = /tmp/rclmontrace
systemfilecommand = xdg-mime query filetype
indexStripChars = 1
detectxattronly = 1
# The test data tree is the only entry in topdirs.
topdirs = @RECOLL_TESTDATA@
# Disabled setting, kept for reference.
#thrQSizes = -1 -1 -1
# The "+" and "-" suffixes on a key name adjust an existing list instead of
# replacing it.
# Adding to skippedNames
skippedNames+ = notinskippednames
# Removing from skippedNames
skippedNames- = recollrc
# Adding to noContentSuffixes
noContentSuffixes+ = .nosuff
# Removing from noContentSuffixes
noContentSuffixes- = .md5
# Comics_12 causes rclppt to loop. We keep it around for general testing,
# but it takes too much time when running the test set, so it is listed in
# skippedPaths below.
skippedPaths = \
@RECOLL_TESTDATA@/.hg \
@RECOLL_TESTDATA@/skipped/real* \
@RECOLL_TESTDATA@/config \
@RECOLL_TESTDATA@/ppt/Comics_12.pps
# Same entries as skippedPaths, except that Comics_12.pps is not listed.
daemSkippedPaths = \
@RECOLL_TESTDATA@/.hg \
@RECOLL_TESTDATA@/skipped/real* \
@RECOLL_TESTDATA@/config
# unac_except_trans (next line) also carries the apostrophe and dash
# character conversions. It contains look-alike Unicode characters: edit it
# only with an editor that preserves them exactly.
unac_except_trans = åå Åå ää Ää öö Öö üü Üü ßss œoe Œoe æae ÆAE fifi flfl ' ❜' ʼ' -
# PDF handling options.
# NOTE(review): pdfextrameta presumably lists extra metadata fields to
# extract, and pdfextrametafix a script that post-processes them -- confirm
# against the Recoll manual.
pdfextrameta = pdf:Producer dc:identifier
pdfextrametafix = @RECOLL_TESTS@/config/pdfemf.py
# Can't use a dir key here, as rclpdf doesn't call setkeydir
pdfattach = 1
# Per-directory sections: each [path] header introduces settings for one
# subdirectory of the test data tree.

# OCR settings for the pdf directory (tesseract, language "eng").
[@RECOLL_TESTDATA@/pdf]
ocrprogs = tesseract
pdfocr = 1
pdfocrlang = eng
# Default character sets for two directories.
[@RECOLL_TESTDATA@/utf8]
defaultcharset = utf-8
[@RECOLL_TESTDATA@/ru_RU.KOI8-R]
defaultcharset = KOI8-R
[@RECOLL_TESTDATA@/info]
localfields = rclaptg=gnuinfo
[@RECOLL_TESTDATA@/mail/thunderbird]
mhmboxquirks = tbird
# NOTE(review): the leading ";", the irregular spacing and the quoted value
# below look deliberate (presumably exercising the localfields parser) --
# do not normalise them.
[@RECOLL_TESTDATA@/cjk]
localfields= ; keyword = ckjtsthuniique; blabla= "some string"
# MIME type selection settings, one directory per case.
[@RECOLL_TESTDATA@/idxtypes]
indexedmimetypes = text/plain
[@RECOLL_TESTDATA@/excltypes]
excludedmimetypes = text/plain
[@RECOLL_TESTDATA@/excludehtml]
indexedmimetypes = application/pdf
# File name patterns for the onlynames directory.
[@RECOLL_TESTDATA@/onlynames]
onlyNames = *.matchesonepat *.matchestwopat