diff --git a/src/sampleconf/mimeconf b/src/sampleconf/mimeconf index a85e2f78..47b8d099 100644 --- a/src/sampleconf/mimeconf +++ b/src/sampleconf/mimeconf @@ -28,14 +28,14 @@ application/x-bzip2 = uncompress rcluncomp bunzip2 %f %t # A different format (ie text/plain), and a character set can be defined for # each filter, see the exemples below (ie: msword) [index] -# Note: rcldoc did some work to splice hyphenated words at eol. Seems -# actually not needed because antiword apparently does it too + +# MSWORD: if antiword fails with the "text stream of this file is too small +# to handle" error, install wvWare and restore the rcldoc version below. # application/msword = exec rcldoc application/msword = exec antiword -t -i 1 -m UTF-8;mimetype=text/plain;charset=utf-8 -# Alternatively you can use wvWare for msword. It's much slower than -# antiword, but will handle documents which provoke the 'I'm afraid the -# text stream of this file is too small to handle' antiword error +# You can also use wvWare directly, but it is much slower. # application/msword = exec wvWare --charset=utf-8 --nographics + application/ogg = execm rclaudio application/pdf = exec rclpdf application/postscript = exec pstotext;charset=iso-8859-1;mimetype=text/plain diff --git a/website/BUGS.html b/website/BUGS.html index 09f41004..f13d4e8c 100644 --- a/website/BUGS.html +++ b/website/BUGS.html @@ -67,15 +67,19 @@
I'm afraid the text stream of this file is too small to handle. -+ + Only small files produced by Microsoft Word on a Mac, or by - OpenOffice will trigger this message. As a workaround, install - wvWare and modify mimeconf to use the rcldoc filter (instead of - directly executing antiword). Rcldoc will try antiword, then - will use vwWare if it is available. This will result in - slightly slower indexing for doc files. + OpenOffice will trigger this message.