<?xml version="1.0" encoding="UTF-8"?>
<!--
Licensed to the Apache Software Foundation (ASF) under one
or more contributor license agreements. See the NOTICE file
distributed with this work for additional information
regarding copyright ownership. The ASF licenses this file
to you under the Apache License, Version 2.0 (the
"License"); you may not use this file except in compliance
with the License. You may obtain a copy of the License at

  http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing,
software distributed under the License is distributed on an
"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
KIND, either express or implied. See the License for the
specific language governing permissions and limitations
under the License.
-->
<!--
  Descriptor for a primitive UIMA analysis engine implemented by
  org.apache.uima.tika.MarkupAnnotator. It declares three mandatory
  configuration parameters (with values supplied below), imports the
  MarkupAnnotationTypeSystem type system by name, and binds an optional
  external resource pointing at a Tika configuration file.
-->
<analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
  <primitive>true</primitive>
  <annotatorImplementationName>org.apache.uima.tika.MarkupAnnotator</annotatorImplementationName>

  <analysisEngineMetaData>
    <name>org.apache.uima.tika.MarkupAnnotator</name>
    <description>Uses Tika to generate annotations from original markup</description>
    <version>1.0</version>
    <vendor>Apache Software Foundation</vendor>

    <!-- Parameter declarations: all three are single-valued and mandatory. -->
    <configurationParameters>
      <configurationParameter>
        <name>ORIGINAL_VIEW_PARAM_NAME</name>
        <description>Name of the view used for storing the original content</description>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>TEXT_VIEW_PARAM_NAME</name>
        <description>Name of the view used to store the text extracted from the original document</description>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>SET_TEXT_VIEW_DEFAULT_PARAM_NAME</name>
        <description>Indicates whether the Text view should be marked as the one to use by default</description>
        <type>Boolean</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
    </configurationParameters>

    <!-- Values for the parameters declared above; each mandatory parameter has one. -->
    <configurationParameterSettings>
      <nameValuePair>
        <name>ORIGINAL_VIEW_PARAM_NAME</name>
        <value>
          <string>_InitialView</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>TEXT_VIEW_PARAM_NAME</name>
        <value>
          <string>textView</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>SET_TEXT_VIEW_DEFAULT_PARAM_NAME</name>
        <value>
          <boolean>true</boolean>
        </value>
      </nameValuePair>
    </configurationParameterSettings>

    <!-- The type system is imported by name, not by file location. -->
    <typeSystemDescription>
      <imports>
        <import name="MarkupAnnotationTypeSystem"/>
      </imports>
    </typeSystemDescription>
    <typePriorities/>
    <fsIndexCollection/>

    <!--
      Declares no input types and a single output type with all of its features.
      NOTE(review): the parameters above name two views, but no inputSofas or
      outputSofas are declared in this capability. Confirm against the annotator
      class whether sofa capabilities should be listed here.
    -->
    <capabilities>
      <capability>
        <inputs/>
        <outputs>
          <type allAnnotatorFeatures="true">org.apache.uima.MarkupAnnotation</type>
        </outputs>
        <languagesSupported>
          <language>x-unspecified</language>
        </languagesSupported>
      </capability>
    </capabilities>

    <!--
      NOTE(review): outputsNewCASes is set to true. That flag is normally used by
      components that emit additional CASes (CAS multipliers). Confirm that
      MarkupAnnotator really does so before relying on or changing this value.
    -->
    <operationalProperties>
      <modifiesCas>true</modifiesCas>
      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
      <outputsNewCASes>true</outputsNewCASes>
    </operationalProperties>
  </analysisEngineMetaData>

  <!-- Optional dependency: the engine declares it can run without this resource. -->
  <externalResourceDependencies>
    <externalResourceDependency>
      <key>tikaConfigFile</key>
      <description>XML configuration file for Tika</description>
      <optional>true</optional>
    </externalResourceDependency>
  </externalResourceDependencies>

  <!-- Defines the file resource and binds it to the dependency key of the same name. -->
  <resourceManagerConfiguration>
    <externalResources>
      <externalResource>
        <name>tikaConfigFile</name>
        <description>XML config file for Tika. If not found the component will rely on the default config</description>
        <fileResourceSpecifier>
          <fileUrl>tika_config.xml</fileUrl>
        </fileResourceSpecifier>
      </externalResource>
    </externalResources>
    <externalResourceBindings>
      <externalResourceBinding>
        <key>tikaConfigFile</key>
        <resourceName>tikaConfigFile</resourceName>
      </externalResourceBinding>
    </externalResourceBindings>
  </resourceManagerConfiguration>
</analysisEngineDescription>