blob: dba80180b47f0d62ffba1277371ca9b12e3331c9 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.uima.ruta.engine;
import java.io.File;
import java.io.FileOutputStream;
import org.apache.uima.UimaContext;
import org.apache.uima.analysis_engine.AnalysisEngineProcessException;
import org.apache.uima.cas.AbstractCas;
import org.apache.uima.cas.CAS;
import org.apache.uima.cas.FSIterator;
import org.apache.uima.cas.Feature;
import org.apache.uima.cas.Type;
import org.apache.uima.cas.impl.XmiCasSerializer;
import org.apache.uima.cas.text.AnnotationFS;
import org.apache.uima.fit.component.JCasMultiplier_ImplBase;
import org.apache.uima.fit.descriptor.ConfigurationParameter;
import org.apache.uima.jcas.JCas;
import org.apache.uima.resource.ResourceInitializationException;
import org.apache.uima.util.CasCopier;
import org.apache.uima.util.XMLSerializer;
/**
* This Analysis Engine is able to serialize the processed CAS to an XMI file whereas the the source
* and destination view can be specified A descriptor file for this Analysis Engine is located in
* the folder <code>descriptor/utils</code> of a UIMA Ruta project.
*
*/
public class ViewWriter extends JCasMultiplier_ImplBase {
/**
* This string parameter specifies the absolute path of the resulting file named
* <code>output.xmi</code>. However, if an annotation of the type
* <code>org.apache.uima.examples.SourceDocumentInformation</code> is given, then the value of
* this parameter is interpreted to be relative to the URI stored in the annotation and the name
* of the file will be adapted to the name of the source file. If this functionality is activated
* in the preferences, then the UIMA Ruta Workbench adds the SourceDocumentInformation annotation
* when the user launches a script file.
*/
public static final String PARAM_OUTPUT = "output";
@ConfigurationParameter(name = PARAM_OUTPUT, mandatory = false, defaultValue = "")
private String output;
/**
* The name of the view that should be stored in a file. The default value is "_InitialView".
*/
public static final String PARAM_INPUT_VIEW = "inputView";
@ConfigurationParameter(name = PARAM_INPUT_VIEW, mandatory = false, defaultValue = "_InitialView")
private String inputView;
/**
* The name, which should be used, to store the view in the file. The default value is "_InitialView".
*/
public static final String PARAM_OUTPUT_VIEW = "outputView";
@ConfigurationParameter(name = PARAM_OUTPUT_VIEW, mandatory = false, defaultValue = "_InitialView")
private String outputView;
private CAS outView;
@Override
public void initialize(UimaContext aContext) throws ResourceInitializationException {
super.initialize(aContext);
output = (String) aContext.getConfigParameterValue(PARAM_OUTPUT);
inputView = (String) aContext.getConfigParameterValue(PARAM_INPUT_VIEW);
outputView = (String) aContext.getConfigParameterValue(PARAM_OUTPUT_VIEW);
}
private static void writeXmi(CAS aCas, File name) throws Exception {
FileOutputStream out = null;
try {
// write XMI
out = new FileOutputStream(name);
XmiCasSerializer ser = new XmiCasSerializer(aCas.getTypeSystem());
XMLSerializer xmlSer = new XMLSerializer(out, false);
ser.serialize(aCas, xmlSer.getContentHandler());
} catch (Exception e) {
throw e;
} finally {
if (out != null) {
out.close();
}
}
}
@Override
public void process(JCas jcas) throws AnalysisEngineProcessException {
CAS cas = jcas.getCas();
Type sdiType = cas.getTypeSystem().getType(RutaEngine.SOURCE_DOCUMENT_INFORMATION);
File file = new File(output);
if (file.isDirectory()) {
String filename = "output.xmi";
file = new File(output, filename);
}
if (sdiType != null) {
FSIterator<AnnotationFS> sdiit = cas.getAnnotationIndex(sdiType).iterator();
if (sdiit.isValid()) {
AnnotationFS annotationFS = sdiit.get();
Feature uriFeature = sdiType.getFeatureByBaseName("uri");
String stringValue = annotationFS.getStringValue(uriFeature);
File f = new File(stringValue);
String name = f.getName();
if (!name.endsWith(".xmi")) {
name = name + ".xmi";
}
String parent = f.getParent().endsWith("/") ? f.getParent() : f.getParent() + "/";
file = new File(parent + output, name);
file.getParentFile().mkdirs();
}
}
CAS inView = cas.getView(inputView);
if (outView == null) {
outView = getContext().getEmptyCas(CAS.class);
}
outView.reset();
CasCopier cc = new CasCopier(inView, outView, true);
cc.copyCasView(inView, outputView, true);
try {
writeXmi(outView, file);
} catch (Exception e) {
throw new AnalysisEngineProcessException(e);
}
}
@Override
public void collectionProcessComplete() {
if (outView != null) {
outView.release();
}
outView = null;
}
public boolean hasNext() throws AnalysisEngineProcessException {
return false;
}
public AbstractCas next() throws AnalysisEngineProcessException {
return null;
}
}