From 81d486d4be8c8a9790c1607d0ecb2236b7c68978 Mon Sep 17 00:00:00 2001 From: Uwe Steinmann Date: Tue, 25 Jun 2013 16:53:52 +0200 Subject: [PATCH] add -enc parameter to pdftotext --- install/settings.xml.template_install | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/install/settings.xml.template_install b/install/settings.xml.template_install index 847c03578..57c8f449e 100644 --- a/install/settings.xml.template_install +++ b/install/settings.xml.template_install @@ -234,7 +234,7 @@ - pdftotext -nopgbrk %s - | sed -e 's/ [a-zA-Z0-9.]\{1\} / /g' -e 's/[0-9.]//g' + pdftotext -enc UTF-8 -nopgbrk %s - | sed -e 's/ [a-zA-Z0-9.]\{1\} / /g' -e 's/[0-9.]//g' catdoc %s