| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| |
| package org.apache.uima.cas.test; |
| |
| import java.io.File; |
| import java.io.IOException; |
| |
| import javax.xml.parsers.SAXParser; |
| import javax.xml.parsers.SAXParserFactory; |
| |
| import org.apache.uima.UIMAFramework; |
| import org.apache.uima.cas.CAS; |
| import org.apache.uima.cas.impl.XCASDeserializer; |
| import org.apache.uima.cas.text.AnnotationTreeNode; |
| import org.apache.uima.resource.metadata.FsIndexDescription; |
| import org.apache.uima.resource.metadata.TypeSystemDescription; |
| import org.apache.uima.test.junit_extension.JUnitExtension; |
| import org.apache.uima.util.CasCreationUtils; |
| import org.apache.uima.util.XMLInputSource; |
| |
| import junit.framework.TestCase; |
| |
| public class AnnotationTreeTest extends TestCase { |
| |
| private static final String casDataDirName = "CASTests"; |
| |
| private static final String xcasSampleDirName = "xcas"; |
| |
| private static final String sampleXcas1FileName = "sample1.xcas"; |
| |
| private static final String sampleTsFileName = "sample.ts"; |
| |
| public AnnotationTreeTest(String desc) { |
| super(desc); |
| } |
| |
| public void testTree() throws Exception { |
| |
| // The two XCASes used in this test contain the same data, but the |
| // second one contains all annotations twice. So in that case, every |
| // other annotation is filtered by the unambiguous iterator. |
| |
| File dataDir = JUnitExtension.getFile(casDataDirName); |
| File xcasDir = new File(dataDir, xcasSampleDirName); |
| |
| try { |
| File tsFile = new File(xcasDir, sampleTsFileName); |
| Object descriptor = UIMAFramework.getXMLParser().parse(new XMLInputSource(tsFile)); |
| // instantiate CAS to get type system. Also build style |
| // map file if there is none. |
| TypeSystemDescription tsDesc = (TypeSystemDescription) descriptor; |
| CAS cas = CasCreationUtils.createCas(tsDesc, null, new FsIndexDescription[0]); |
| SAXParser parser = SAXParserFactory.newInstance().newSAXParser(); |
| XCASDeserializer xcasDeserializer = new XCASDeserializer(cas.getTypeSystem()); |
| File xcasFile = new File(xcasDir, sampleXcas1FileName); |
| parser.parse(xcasFile, xcasDeserializer.getXCASHandler(cas)); |
| AnnotationTreeNode root = cas.getAnnotationIndex().tree(cas.getDocumentAnnotation()) |
| .getRoot(); |
| // There are 7 paragraph annotations in the CAS. |
| assertTrue("There should be 7 paragraphs, but are: " + root.getChildCount(), root |
| .getChildCount() == 7); |
| // The first paragraph contains 19 sentences, each subsequent one |
| // contains only one sentence. |
| assertTrue(root.getChild(0).getChildCount() == 19); |
| for (int i = 1; i < root.getChildCount(); i++) { |
| assertTrue(root.getChild(i).getChildCount() == 1); |
| } |
| // First sentence contains 8 tokens. |
| assertTrue(root.getChild(0).getChild(0).getChildCount() == 8); |
| // Same for only sentence in second paragraph. |
| assertTrue(root.getChild(1).getChild(0).getChildCount() == 8); |
| } catch (IOException e) { |
| e.printStackTrace(); |
| assertTrue(false); |
| } |
| } |
| |
| } |