daffodil-runtime1/src/main/scala/edu/illinois/ncsa/daffodil/api/DFDLParserUnparser.scala - daffodil - Git at Google

 /* Copyright (c) 2012-2015 Tresys Technology, LLC. All rights reserved.
  *
  * Developed by: Tresys Technology, LLC
  *               http://www.tresys.com
  *
  * Permission is hereby granted, free of charge, to any person obtaining a copy of
  * this software and associated documentation files (the "Software"), to deal with
  * the Software without restriction, including without limitation the rights to
  * use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
  * of the Software, and to permit persons to whom the Software is furnished to do
  * so, subject to the following conditions:
  *
  *  1. Redistributions of source code must retain the above copyright notice,
  *     this list of conditions and the following disclaimers.
  *
  *  2. Redistributions in binary form must reproduce the above copyright
  *     notice, this list of conditions and the following disclaimers in the
  *     documentation and/or other materials provided with the distribution.
  *
  *  3. Neither the names of Tresys Technology, nor the names of its contributors
  *     may be used to endorse or promote products derived from this Software
  *     without specific prior written permission.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  * CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS WITH THE
  * SOFTWARE.
  */

 package edu.illinois.ncsa.daffodil.api

 import edu.illinois.ncsa.daffodil.processors.ProcessorResult
 import edu.illinois.ncsa.daffodil.processors.Success
 import java.io.File
 import edu.illinois.ncsa.daffodil.processors.VariableMap
 import edu.illinois.ncsa.daffodil.externalvars.Binding
 import edu.illinois.ncsa.daffodil.infoset.InfosetInputter
 import edu.illinois.ncsa.daffodil.infoset.InfosetOutputter
 import edu.illinois.ncsa.daffodil.processors.Failure

 /**
  * This file contains traits that define an abstract API that any DFDL processor
  * can satisfy. The intention is to allow test rigs and other systems to run tests
  * against multiple DFDL implementations for comparison purposes.
  */

 /**
  * APIs for DFDL Parsing and Unparsing
  *
  * Assumed that applications will provide information not all at once, but will provide first:
  * <ol>
  * <li> Schema (which can be multiple schema files by way of include/import)
  * <li> XML Catalog, or other means by which include/import are found.
  * <li> Control settings/features for how they want the parser to behave.
  * <li> Error handlers.
  * <li> Root node and namespace
  * <li> Externally defined variables
  * </ol>
  * After that, the application will want to use one of two primary patterns:
  * <ul>
  * <li> Random access: one input source, evaluate many different paths
  * <li> Bulk Parsing: one path, many different input sources
  * </ul>
  * The output direction is symmetric.
  *
  * So the API provides a way to set the path specially, providing for schema-aware compilation of the XPath expression in the bulk processing case.
  *
  */
 object DFDL {

   type Input = java.nio.channels.ReadableByteChannel // binary input stream/buffer
   type Output = java.nio.channels.WritableByteChannel // binary output stream/buffer

   trait Compiler {

     /**
      * User must establish error handlers, setup features appropriately before using the data access objects.
      *
      * Other features are TBD, but may include
      *
      * <ul>
      * <li>validation checking of the data - whether to warn or error.
      * <li>schema validation - validation of the DFDL Schema itself
      * <li>error recovery information - paths to anchor elements or similar
      * <li>error and warning tolerances - how many before failing entirely, escalation for warnings
      * <li>debug modes & tracing modes
      * <li>amount of buffering to make available for backward reference (0 meaning no backward reference)
      * <li>amount of buffering to make available for lookahead/speculation - bounding this can make error detection/recovery faster
      * <li>grammar ambiguity policies - whether to escalate certain ambiguous use of delimiters to errors, or try to parse anyway
      * </ul>
      */

     /**
      * There are two places you can set the root element, or you can omit it.
      * You can set it here on the compiler. This saves compilation time, as
      * it will only compile things needed by your root element. (Good to make
      * tests run fast.) If you don't specify a root, then it compiles all top
      * level elements, anticipating that different uses of the compiled schema
      * might subsequently ask for different top level elements.
      *
      * If you don't specify a root here, then you can specify one later on the
      * ProcessorFactory object, but that won't save you as much compilation time.
      *
      * If you don't set a root at all, then it compiles all top level elements
      * and uses the first element in the first schema file as the root.
      *
      * When specifying a root element, you either specify its namespace, or
      * you can specify the empty string "" as the namespace which means "no namespace".
      * If you specify a root element name, but pass null as the namespace, then
      * it will search for a unique element with your root element name, and
      * if that is unambiguous, it will use it as the root.
      */
     def setDistinguishedRootNode(name: String, namespace: String)
     def setExternalDFDLVariable(name: String, namespace: String, value: String)

     /**
      * Compilation returns a parser factory, which must be interrogated for diagnostics
      * to see if compilation was successful or not.
      */
     def compileSource(schemaSource: DaffodilSchemaSource): ProcessorFactory

     def reload(savedParser: File): DataProcessor
   }

   /**
    * The point of processor factory is to allow compilation of the path expression.
    */
   trait ProcessorFactory extends WithDiagnostics {

     /**
      * If you didn't set a root on the compiler, then get another
      * chance to specify one here.
      *
      * If you don't set a root at all it uses the first element in the
      * first schema document as the root.
      *
      * If you don't specify a namespace, or pass null, then it searches, and if
      * it is unambiguous, it will use the unique global element with
      * that name.
      *
      * Note: null used specifically here not an Option type, because this API
      * will shine through to a Java API.
      *
      * To explicitly specify that there is no-namespace, pass "" as
      * the namespace argument.
      */
     def setDistinguishedRootNode(name: String, namespace: String = null)
     def onPath(xpath: String): DataProcessor
   }

   trait DataProcessor extends WithDiagnostics {
     def setValidationMode(mode: ValidationMode.Type): Unit
     def getValidationMode(): ValidationMode.Type
     def save(output: DFDL.Output): Unit
     def setExternalVariables(extVars: Map[String, String]): Unit
     def setExternalVariables(extVars: File): Unit
     def setExternalVariables(extVars: File, tunable: DaffodilTunables): Unit
     def setExternalVariables(extVars: Seq[Binding]): Unit
     def getVariables(): VariableMap
     def setTunable(tunable: String, value: String): Unit
     def setTunables(tunables: Map[String,String]): Unit
     def getTunables(): DaffodilTunables

     /**
      * Unparses (that is, serializes) data to the output, returns an object which contains any diagnostics.
      */
     def unparse(input: InfosetInputter, output: DFDL.Output): UnparseResult
     /**
      * Returns an object which contains the result, and/or diagnostic information.
      *
      * For testing purposes (mostly), you can restrict the number of bits to
      * fewer than the entire input.
      */
     def parse(input: Input, output: InfosetOutputter, lengthLimitInBits: Long = -1): ParseResult

     /**
      * Returns an object which contains the result, and/or diagnostic information.
      * <p>
      * Use this rather than passing a channel/stream because it enables some
      * I/O optimizations.
      */
     def parse(file: File, output: InfosetOutputter): ParseResult
   }

   trait ParseResult extends Result with WithDiagnostics {
     def resultState: State
   }

   trait UnparseResult extends Result with WithDiagnostics {
     /**
      * Data is 'scannable' if it consists entirely of textual data, and that data
      * is all in the same encoding.
      */
     def isScannable: Boolean
     def encodingName: String
   }

   /**
    * Interface for Parse and Unparse states
    */
   trait State {
     def processorStatus: ProcessorResult
     def validationStatus: Boolean
     def diagnostics: Seq[Diagnostic]
     def currentLocation: DataLocation
   }

   /**
    * Interface for Parse and Unparse results
    */
   abstract class Result {
     protected def resultState: State
     var diagnostics: Seq[Diagnostic] = Nil

     private def resultStatusDiagnostics: Seq[Diagnostic] = {
       resultState.processorStatus match {
         case Failure(c) => List(c)
         case Success => Nil
       }
     }

     def getDiagnostics = {
       (diagnostics.toSet ++ resultState.diagnostics.toSet ++ resultStatusDiagnostics.toSet).toSeq
     }

     def addDiagnostic(d: Diagnostic) {
       diagnostics = d +: diagnostics
     }

     def isError = isProcessingError || isValidationError
     def isProcessingError = resultState.processorStatus != Success
     def isValidationError = resultState.validationStatus != true
   }
 }
	/* Copyright (c) 2012-2015 Tresys Technology, LLC. All rights reserved.
	*
	* Developed by: Tresys Technology, LLC
	* http://www.tresys.com
	*
	* Permission is hereby granted, free of charge, to any person obtaining a copy of
	* this software and associated documentation files (the "Software"), to deal with
	* the Software without restriction, including without limitation the rights to
	* use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
	* of the Software, and to permit persons to whom the Software is furnished to do
	* so, subject to the following conditions:
	*
	* 1. Redistributions of source code must retain the above copyright notice,
	* this list of conditions and the following disclaimers.
	*
	* 2. Redistributions in binary form must reproduce the above copyright
	* notice, this list of conditions and the following disclaimers in the
	* documentation and/or other materials provided with the distribution.
	*
	* 3. Neither the names of Tresys Technology, nor the names of its contributors
	* may be used to endorse or promote products derived from this Software
	* without specific prior written permission.
	*
	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
	* CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS WITH THE
	* SOFTWARE.
	*/

	package edu.illinois.ncsa.daffodil.api

	import edu.illinois.ncsa.daffodil.processors.ProcessorResult
	import edu.illinois.ncsa.daffodil.processors.Success
	import java.io.File
	import edu.illinois.ncsa.daffodil.processors.VariableMap
	import edu.illinois.ncsa.daffodil.externalvars.Binding
	import edu.illinois.ncsa.daffodil.infoset.InfosetInputter
	import edu.illinois.ncsa.daffodil.infoset.InfosetOutputter
	import edu.illinois.ncsa.daffodil.processors.Failure

	/**
	* This file contains traits that define an abstract API that any DFDL processor
	* can satisfy. The intention is to allow test rigs and other systems to run tests
	* against multiple DFDL implementations for comparison purposes.
	*/

	/**
	* APIs for DFDL Parsing and Unparsing
	*
	* Assumed that applications will provide information not all at once, but will provide first:
	* <ol>
	* <li> Schema (which can be multiple schema files by way of include/import)
	* <li> XML Catalog, or other means by which include/import are found.
	* <li> Control settings/features for how they want the parser to behave.
	* <li> Error handlers.
	* <li> Root node and namespace
	* <li> Externally defined variables
	* </ol>
	* After that, the application will want to use one of two primary patterns:
	* <ul>
	* <li> Random access: one input source, evaluate many different paths
	* <li> Bulk Parsing: one path, many different input sources
	* </ul>
	* The output direction is symmetric.
	*
	* So the API provides a way to set the path specially, providing for schema-aware compilation of the XPath expression in the bulk processing case.
	*
	*/
	object DFDL {

	type Input = java.nio.channels.ReadableByteChannel // binary input stream/buffer
	type Output = java.nio.channels.WritableByteChannel // binary output stream/buffer

	trait Compiler {

	/**
	* User must establish error handlers, setup features appropriately before using the data access objects.
	*
	* Other features are TBD, but may include
	*
	* <ul>
	* <li>validation checking of the data - whether to warn or error.
	* <li>schema validation - validation of the DFDL Schema itself
	* <li>error recovery information - paths to anchor elements or similar
	* <li>error and warning tolerances - how many before failing entirely, escalation for warnings
	* <li>debug modes & tracing modes
	* <li>amount of buffering to make available for backward reference (0 meaning no backward reference)
	* <li>amount of buffering to make available for lookahead/speculation - bounding this can make error detection/recovery faster
	* <li>grammar ambiguity policies - whether to escalate certain ambiguous use of delimiters to errors, or try to parse anyway
	* </ul>
	*/

	/**
	* There are two places you can set the root element, or you can omit it.
	* You can set it here on the compiler. This saves compilation time, as
	* it will only compile things needed by your root element. (Good to make
	* tests run fast.) If you don't specify a root, then it compiles all top
	* level elements, anticipating that different uses of the compiled schema
	* might subsequently ask for different top level elements.
	*
	* If you don't specify a root here, then you can specify one later on the
	* ProcessorFactory object, but that won't save you as much compilation time.
	*
	* If you don't set a root at all, then it compiles all top level elements
	* and uses the first element in the first schema file as the root.
	*
	* When specifying a root element, you either specify its namespace, or
	* you can specify the empty string "" as the namespace which means "no namespace".
	* If you specify a root element name, but pass null as the namespace, then
	* it will search for a unique element with your root element name, and
	* if that is unambiguous, it will use it as the root.
	*/
	def setDistinguishedRootNode(name: String, namespace: String)
	def setExternalDFDLVariable(name: String, namespace: String, value: String)

	/**
	* Compilation returns a parser factory, which must be interrogated for diagnostics
	* to see if compilation was successful or not.
	*/
	def compileSource(schemaSource: DaffodilSchemaSource): ProcessorFactory

	def reload(savedParser: File): DataProcessor
	}

	/**
	* The point of processor factory is to allow compilation of the path expression.
	*/
	trait ProcessorFactory extends WithDiagnostics {

	/**
	* If you didn't set a root on the compiler, then get another
	* chance to specify one here.
	*
	* If you don't set a root at all it uses the first element in the
	* first schema document as the root.
	*
	* If you don't specify a namespace, or pass null, then it searches, and if
	* it is unambiguous, it will use the unique global element with
	* that name.
	*
	* Note: null used specifically here not an Option type, because this API
	* will shine through to a Java API.
	*
	* To explicitly specify that there is no-namespace, pass "" as
	* the namespace argument.
	*/
	def setDistinguishedRootNode(name: String, namespace: String = null)
	def onPath(xpath: String): DataProcessor
	}

	trait DataProcessor extends WithDiagnostics {
	def setValidationMode(mode: ValidationMode.Type): Unit
	def getValidationMode(): ValidationMode.Type
	def save(output: DFDL.Output): Unit
	def setExternalVariables(extVars: Map[String, String]): Unit
	def setExternalVariables(extVars: File): Unit
	def setExternalVariables(extVars: File, tunable: DaffodilTunables): Unit
	def setExternalVariables(extVars: Seq[Binding]): Unit
	def getVariables(): VariableMap
	def setTunable(tunable: String, value: String): Unit
	def setTunables(tunables: Map[String,String]): Unit
	def getTunables(): DaffodilTunables

	/**
	* Unparses (that is, serializes) data to the output, returns an object which contains any diagnostics.
	*/
	def unparse(input: InfosetInputter, output: DFDL.Output): UnparseResult
	/**
	* Returns an object which contains the result, and/or diagnostic information.
	*
	* For testing purposes (mostly), you can restrict the number of bits to
	* fewer than the entire input.
	*/
	def parse(input: Input, output: InfosetOutputter, lengthLimitInBits: Long = -1): ParseResult

	/**
	* Returns an object which contains the result, and/or diagnostic information.
	* <p>
	* Use this rather than passing a channel/stream because it enables some
	* I/O optimizations.
	*/
	def parse(file: File, output: InfosetOutputter): ParseResult
	}

	trait ParseResult extends Result with WithDiagnostics {
	def resultState: State
	}

	trait UnparseResult extends Result with WithDiagnostics {
	/**
	* Data is 'scannable' if it consists entirely of textual data, and that data
	* is all in the same encoding.
	*/
	def isScannable: Boolean
	def encodingName: String
	}

	/**
	* Interface for Parse and Unparse states
	*/
	trait State {
	def processorStatus: ProcessorResult
	def validationStatus: Boolean
	def diagnostics: Seq[Diagnostic]
	def currentLocation: DataLocation
	}

	/**
	* Interface for Parse and Unparse results
	*/
	abstract class Result {
	protected def resultState: State
	var diagnostics: Seq[Diagnostic] = Nil

	private def resultStatusDiagnostics: Seq[Diagnostic] = {
	resultState.processorStatus match {
	case Failure(c) => List(c)
	case Success => Nil
	}
	}

	def getDiagnostics = {
	(diagnostics.toSet ++ resultState.diagnostics.toSet ++ resultStatusDiagnostics.toSet).toSeq
	}

	def addDiagnostic(d: Diagnostic) {
	diagnostics = d +: diagnostics
	}

	def isError = isProcessingError \|\| isValidationError
	def isProcessingError = resultState.processorStatus != Success
	def isValidationError = resultState.validationStatus != true
	}
	}