# $Id: ExtractText.cf,v 1.8 2009/07/10 13:49:37 jonas Exp $
# Turn on the plugin's mime_magic option.
# NOTE(review): presumably this enables content-type detection from file
# contents rather than trusting the declared MIME type -- confirm against the
# plugin documentation.
extracttext_mime_magic yes
# Optional logging switches; commented out here, remove the leading "#" to
# enable them.
#extracttext_log_to_stderr yes
#extracttext_log_msgid yes
#extracttext_log_text yes
# Optional "ExtractText" header added to all messages; commented out here.
# The template references the plugin's CHARS, WORDS, FLAGS, TOOLS, EXTENSIONS
# and TYPES tags.
#add_header all ExtractText _EXTRACTTEXTCHARS_ _EXTRACTTEXTWORDS_ <_EXTRACTTEXTFLAGS_> [_EXTRACTTEXTTOOLS_] {_EXTRACTTEXTEXTENSIONS_} (_EXTRACTTEXTTYPES_)
# antiword: external command used to extract text from legacy MS Word files.
# It is invoked with "-" as its file argument and asked for UTF-8 output
# (-m UTF-8.txt), in line with the {CS:UTF-8} declaration.
extracttext_external antiword {CS:UTF-8} /usr/local/bin/antiword -t -w 0 -m UTF-8.txt -
# Use antiword for .doc/.dot attachments and for Word MIME types such as
# application/msword or application/vnd.ms-word. The dot after "vnd" is
# escaped with a single backslash so the pattern matches a literal ".";
# a doubled backslash would instead require a literal "\" in the type.
extracttext_use antiword .doc .dot application/(?:vnd\.?)?ms-?word.*
# openxml: extraction is done by a Perl module instead of an external command.
extracttext_module openxml Mail::SpamAssassin::Plugin::ExtractText::OpenXML
# Office Open XML word-processing files: .docx/.dotx/.dotm and MIME types of
# the form application/vnd.openxml...word... The dot after "vnd" is escaped
# with a single backslash; with a doubled backslash the mandatory "vnd" group
# could never match a real MIME type.
extracttext_use openxml .docx .dotx .dotm application/(?:vnd\.?)openxml.*?word.*
# Also registered for the legacy Word extensions and MIME types.
# NOTE(review): presumably because OpenXML files are sometimes sent with the
# old names/types -- confirm this overlap with antiword is intended.
extracttext_use openxml .doc .dot application/(?:vnd\.?)?ms-?word.*
# unrtf: external command used for RTF documents, run with the
# ExtractText.tags output definition (-t) and without pictures (--nopict).
# The {CF:...} pattern matches marker text of the form <{[:=- ... -=:]}>;
# the square brackets are escaped with a single backslash so they are literal
# characters rather than the start of a character class.
# NOTE(review): presumably these markers are emitted via ExtractText.tags and
# the pattern is used to filter them from the output -- confirm.
extracttext_external unrtf {CS:UTF-8} {CF:<{\[:=-.*?-=:\]}>} /usr/local/bin/unrtf -t ExtractText.tags --nopict
# Use unrtf for .rtf files, for .doc files, and for the RTF MIME types.
extracttext_use unrtf .doc .rtf application/rtf text/rtf
# odt2txt: external command used for OpenDocument / StarOffice text files,
# asked for UTF-8 output and given the attachment via the ${file} placeholder.
# The {CF:...} pattern matches bracketed text of the form "[-- Word: ... --]".
# Each regex escape (\[ \s \S \]) uses a single backslash; doubled
# backslashes would turn them into literal "\" characters.
extracttext_external odt2txt {CS:UTF-8} {CF:\[--\s+\S+:\s.*?--\]} /usr/local/bin/odt2txt --encoding=UTF-8 ${file}
# OpenDocument text documents and templates.
extracttext_use odt2txt .odt .ott application/.*?opendocument.*text
# StarOffice / StarWriter documents and templates.
extracttext_use odt2txt .sdw .stw application/(?:x-)?soffice application/(?:x-)?starwriter
extracttext_external pdftohtml {CS:
(2009-07-10)