Ignore:
Timestamp:
2020-06-18T19:22:34+12:00 (4 years ago)
Author:
ak19
Message:

UnknownConverterPlugin configured to use Tika for doc processing

File:
1 edited

Legend:

Unmodified
Added
Removed
  • main/trunk/model-sites-dev/opotiki/collect/textdemo/etc/collectionConfig.xml

    r34136 r34206  
    107 107            <plugin name="PDFv2Plugin">
    108 108                <option name="-convert_to" value="paged_pretty_html"/>
     109            </plugin>
     110            <!-- Configuring an UnknownConverterPlugin for docx processing with Tika -->
     111            <plugin name="UnknownConverterPlugin">
     112              <option name="-exec_cmd" value="java -jar $GSDLHOME/ext/tika/tika-app-1.24.1.jar --html %%INPUT_FILE &gt; %%OUTPUT"/>
     113              <option name="-convert_to" value="html"/>
     114              <option name="-mime_type" value="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
     115              <option name="-srcicon" value="icondocx"/>
     116              <option name="-process_extension" value="docx"/>
    109 117            </plugin>
    110 118            <plugin name="RTFPlugin"/>
Note: See TracChangeset for help on using the changeset viewer.