| <?xml version="1.0" encoding="UTF-8" ?> |
| |
| <!-- |
| *************************************************************** |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| *************************************************************** |
| --> |
| |
| <analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier"> |
| <frameworkImplementation>org.apache.uima.cpp</frameworkImplementation> |
| <primitive>false</primitive> |
| |
| <delegateAnalysisEngineSpecifiers> |
| <delegateAnalysisEngine key="Segmenter"> |
| <import location="SimpleTextSegmenter.xml" /> |
| </delegateAnalysisEngine> |
| |
| <delegateAnalysisEngine key="Tokenizer"> |
| <import location="tok.xml" /> |
| </delegateAnalysisEngine> |
| |
| <delegateAnalysisEngine key="Merger"> |
| <import location="SimpleTextMerger.xml"/> |
| </delegateAnalysisEngine> |
| </delegateAnalysisEngineSpecifiers> |
| |
| <analysisEngineMetaData> |
| <name>Aggregate CAS Multiplier example that segments, annotates and merges CASes</name> |
| <description> |
| Splits a document into pieces (by default sentences, see SimpleTextSegmenter.xml) and then annotate each |
| piece independently and then merges them into one document while keeping only specific annotation types. |
| </description> |
| |
| <configurationParameters> |
| <configurationParameter> |
| <name>AnnotationTypesToPreserve</name> |
| <description>Names of annotation types to keep in the merged CAS</description> |
| <type>String</type> |
| <multiValued>true</multiValued> |
| <mandatory>false</mandatory> |
| <overrides> |
| <parameter>Merger/AnnotationTypesToCopy</parameter> |
| </overrides> |
| </configurationParameter> |
| <configurationParameter> |
| <name>CASOutputFreq</name> |
| <type>Integer</type> |
| <multiValued>false</multiValued> |
| <mandatory>false</mandatory> |
| <overrides> |
| <parameter>Merger/OutputFrequency</parameter> |
| </overrides> |
| </configurationParameter> |
| </configurationParameters> |
| |
| <configurationParameterSettings> |
| <nameValuePair> |
| <name>AnnotationTypesToPreserve</name> |
| <value> |
| <array> |
| <string>uima.tt.TokenAnnotation</string> |
| </array> |
| </value> |
| </nameValuePair> |
| <nameValuePair> |
| <name>CASOutputFreq</name> |
| <value> |
| <integer>2</integer> |
| </value> |
| </nameValuePair> |
| </configurationParameterSettings> |
| |
| <flowConstraints> |
| <fixedFlow> |
| <node>Segmenter</node> |
| <node>Tokenizer</node> |
| <node>Merger</node> |
| </fixedFlow> |
| </flowConstraints> |
| |
| <capabilities> |
| <capability> |
| <inputs /> |
| <outputs> |
| <type>uima.tt.TokenAnnotation</type> |
| </outputs> |
| <languagesSupported> |
| <language>en</language> |
| </languagesSupported> |
| </capability> |
| </capabilities> |
| |
| <operationalProperties> |
| <modifiesCas>true</modifiesCas> |
| <multipleDeploymentAllowed>true</multipleDeploymentAllowed> |
| <outputsNewCASes>true</outputsNewCASes> |
| </operationalProperties> |
| </analysisEngineMetaData> |
| </analysisEngineDescription> |