| /* |
| * Licensed to the Apache Software Foundation (ASF) under one or more |
| * contributor license agreements. See the NOTICE file distributed with |
| * this work for additional information regarding copyright ownership. |
| * The ASF licenses this file to You under the Apache License, Version 2.0 |
| * (the "License"); you may not use this file except in compliance with |
| * the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package opennlp.tools.chunker; |
| |
| import java.util.List; |
| |
| import opennlp.tools.util.Sequence; |
| import opennlp.tools.util.Span; |
| |
| /** |
| * The interface for chunkers which provide chunk tags for a sequence of tokens. |
| */ |
| public interface Chunker { |
| |
| /** |
| * Generates chunk tags for the given sequence returning the result in a list. |
| * |
| * @param toks a list of the tokens or words of the sequence. |
| * @param tags a list of the pos tags of the sequence. |
| * |
| * @return a list of chunk tags for each token in the sequence. |
| * |
| * @deprecated please use {@link #chunk(String[], String[])} instead. |
| */ |
| @Deprecated |
| public List<String> chunk(List<String> toks, List<String> tags); |
| |
| /** |
| * Generates chunk tags for the given sequence returning the result in an array. |
| * |
| * @param toks an array of the tokens or words of the sequence. |
| * @param tags an array of the pos tags of the sequence. |
| * |
| * @return an array of chunk tags for each token in the sequence. |
| */ |
| public String[] chunk(String[] toks, String tags[]); |
| |
| /** |
| * Generates tagged chunk spans for the given sequence returning the result in a span array. |
| * |
| * @param toks an array of the tokens or words of the sequence. |
| * @param tags an array of the pos tags of the sequence. |
| * |
| * @return an array of spans with chunk tags for each chunk in the sequence. |
| */ |
| public Span[] chunkAsSpans(String[] toks, String tags[]); |
| |
| /** |
| * Returns the top k chunk sequences for the specified sentence with the specified pos-tags |
| * @param sentence The tokens of the sentence. |
| * @param tags The pos-tags for the specified sentence. |
| * |
| * @return the top k chunk sequences for the specified sentence. |
| * |
| * @deprecated please use {@link #topKSequences(String[], String[])} instead. |
| */ |
| @Deprecated |
| public Sequence[] topKSequences(List<String> sentence, List<String> tags); |
| |
| |
| /** |
| * Returns the top k chunk sequences for the specified sentence with the specified pos-tags |
| * @param sentence The tokens of the sentence. |
| * @param tags The pos-tags for the specified sentence. |
| * |
| * @return the top k chunk sequences for the specified sentence. |
| */ |
| public Sequence[] topKSequences(String[] sentence, String[] tags); |
| |
| /** |
| * Returns the top k chunk sequences for the specified sentence with the specified pos-tags |
| * @param sentence The tokens of the sentence. |
| * @param tags The pos-tags for the specified sentence. |
| * @param minSequenceScore A lower bound on the score of a returned sequence. |
| * |
| * @return the top k chunk sequences for the specified sentence. |
| */ |
| public Sequence[] topKSequences(String[] sentence, String[] tags, double minSequenceScore); |
| } |