1# This file is an example. The real configuration must be done in conf/elasticsearch.conf
2#
3# Use this file to set up media parsers. The parsers must return text or JSON.
4#
5# Configure one file type per line: file extension followed by parser location (full file system path or URL).
6# You can use %in% as a placeholder for the input file.
7#
8
9# use the local pdftotext tool to extract PDF data:
10pdf    /usr/bin/pdftotext %in% -
11
12# use a free installation of Apache Tika on the web for Word documents
13docx   http://givemetext.okfnlabs.org/tika/rmeta
14
15# use our own parser for JPEGs
16jpg    bin/plugin.php elasticsearch_img %in%
17jpeg   bin/plugin.php elasticsearch_img %in%
18