| <?xml version="1.0" encoding="UTF-8" ?> |
| <!-- |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| --> |
| |
| <!-- Descriptor for a simple name recognizer TAE that uses regular expressions. |
| --> |
| <taeDescription xmlns="http://uima.apache.org/resourceSpecifier"> |
| <frameworkImplementation>org.apache.uima.java</frameworkImplementation> |
| <primitive>true</primitive> |
| <annotatorImplementationName>org.apache.uima.examples.cas.RegExAnnotator</annotatorImplementationName> |
| |
| <analysisEngineMetaData> |
| <name>Simple Name Recognizer using Regular Expressions</name> |
| <description>Detects Names using a simple regular expression.</description> |
| |
| <configurationParameters> |
| <configurationParameter> |
| <name>Patterns</name> |
| <description>Regular expression patterns to match. The language is that supported by Java 1.4.</description> |
| <type>String</type> |
| <multiValued>true</multiValued> |
| <mandatory>false</mandatory> |
| </configurationParameter> |
| |
| <configurationParameter> |
| <name>TypeNames</name> |
| <description>Names of CAS Types to create for the patterns found. The indexes of this array |
| correspond to the indexes of the Patterns or PatternFiles arrays. If a match is found for |
| Patterns[i], it will result in an annotation of type |
| TypeNames[i].</description> |
| <type>String</type> |
| <multiValued>true</multiValued> |
| <mandatory>false</mandatory> |
| </configurationParameter> |
| |
| <configurationParameter> |
| <name>ContainingAnnotationTypes</name> |
| <description>Names of CAS Input Types within which annotations should be created.</description> |
| <type>String</type> |
| <multiValued>true</multiValued> |
| <mandatory>false</mandatory> |
| </configurationParameter> |
| |
| <configurationParameter> |
| <name>AnnotateEntireContainingAnnotation</name> |
| <description>When the ContainingAnnoationTypes parameter is specified, a value of true for this |
| parameter will cause the entire containing annotation to be used as the span of the new |
| annotation, rather than just the span of the regular expression match. This can be used |
| to "classify" previously created annotations according to whether or not they contain |
| text matching a regular expression. |
| </description> |
| <type>Boolean</type> |
| <multiValued>false</multiValued> |
| <mandatory>false</mandatory> |
| </configurationParameter> |
| </configurationParameters> |
| |
| <configurationParameterSettings> |
| <nameValuePair> |
| <name>Patterns</name> |
| <value><array> |
| <string>\p{Upper}\w*(\.?\s\p{Upper}\w*)+</string> |
| </array></value> |
| </nameValuePair> |
| <nameValuePair> |
| <name>TypeNames</name> |
| <value><array> |
| <string>example.Name</string> |
| </array></value> |
| </nameValuePair> |
| </configurationParameterSettings> |
| |
| <typeSystemDescription> |
| <types> |
| |
| <typeDescription> |
| <name>example.Name</name> |
| <description>A proper name.</description> |
| <supertypeName>uima.tcas.Annotation</supertypeName> |
| </typeDescription> |
| |
| </types> |
| </typeSystemDescription> |
| |
| <capabilities> |
| <capability> |
| <inputs/> |
| <outputs> |
| <type>example.Name</type> |
| </outputs> |
| </capability> |
| </capabilities> |
| |
| </analysisEngineMetaData> |
| </taeDescription> |