src/org/apache/xml/security/c14n/implementations/CanonicalizerBase.java - santuario-xml-security-java - Git at Google

 /*
  * Copyright  1999-2004 The Apache Software Foundation.
  *
  *  Licensed under the Apache License, Version 2.0 (the "License");
  *  you may not use this file except in compliance with the License.
  *  You may obtain a copy of the License at
  *
  *      http://www.apache.org/licenses/LICENSE-2.0
  *
  *  Unless required by applicable law or agreed to in writing, software
  *  distributed under the License is distributed on an "AS IS" BASIS,
  *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  *  See the License for the specific language governing permissions and
  *  limitations under the License.
  *
  */
 package org.apache.xml.security.c14n.implementations;


 import java.io.ByteArrayOutputStream;
 import java.io.IOException;
 import java.io.OutputStream;
 import java.io.UnsupportedEncodingException;
 import java.util.ArrayList;
 import java.util.Iterator;
 import java.util.List;
 import java.util.ListIterator;
 import java.util.Set;

 import javax.xml.parsers.DocumentBuilderFactory;

 import org.apache.xml.security.c14n.CanonicalizationException;
 import org.apache.xml.security.c14n.CanonicalizerSpi;
 import org.apache.xml.security.c14n.helper.AttrCompare;
 import org.apache.xml.security.utils.Constants;
 import org.apache.xml.security.utils.XMLUtils;
 import org.w3c.dom.Attr;
 import org.w3c.dom.Comment;
 import org.w3c.dom.Element;
 import org.w3c.dom.NamedNodeMap;
 import org.w3c.dom.Node;
 import org.w3c.dom.ProcessingInstruction;


 /**
  * Abstract base class for canonicalization algorithms.
  *
  * @author Christian Geuer-Pollmann <geuerp@apache.org>
  * @version $Revision$
  */
 public abstract class CanonicalizerBase extends CanonicalizerSpi {
    //Constants to be outputed, In char array form, so
    //less garbage is generate when outputed.
    private static final byte[] _END_PI = {'?','>'};
    private static final byte[] _BEGIN_PI = {'<','?'};
    private static final byte[] _END_COMM = {'-','-','>'};
    private static final byte[] _BEGIN_COMM = {'<','!','-','-'};
    private static final byte[] __XA_ = {'&','#','x','A',';'};
    private static final byte[] __X9_ = {'&','#','x','9',';'};
    private static final byte[] _QUOT_ = {'&','q','u','o','t',';'};
    private static final byte[] __XD_ = {'&','#','x','D',';'};
    private static final byte[] _GT_ = {'&','g','t',';'};
    private static final byte[] _LT_ = {'&','l','t',';'};
    private static final byte[] _END_TAG = {'<','/'};
    private static final byte[] _AMP_ = {'&','a','m','p',';'};
    final static AttrCompare COMPARE=new AttrCompare();
    final static String XML="xml";
    final static String XMLNS="xmlns";
    final static byte[] equalsStr= {'=','\"'};
    static final int NODE_BEFORE_DOCUMENT_ELEMENT = -1;
    static final int NODE_NOT_BEFORE_OR_AFTER_DOCUMENT_ELEMENT = 0;
    static final int NODE_AFTER_DOCUMENT_ELEMENT = 1;
    //The null xmlns definiton.
    protected static final Attr nullNode;
    static {
     try {
         nullNode=DocumentBuilderFactory.newInstance().
             newDocumentBuilder().newDocument().createAttributeNS(Constants.NamespaceSpecNS,XMLNS);
         nullNode.setValue("");
     } catch (Exception e) {
         throw new RuntimeException("Unable to create nullNode"/*,*/+e);
     }
    }

    boolean _includeComments;
    Set _xpathNodeSet = null;
    /**
     * The node to be skiped/excluded from the DOM tree
     * in subtree canonicalizations.
     */
    Node _excludeNode =null;
    OutputStream _writer = new ByteArrayOutputStream();//null;

    /**
     * Constructor CanonicalizerBase
     *
     * @param includeComments
     */
    public CanonicalizerBase(boolean includeComments) {
       this._includeComments = includeComments;
    }

    /**
     * Method engineCanonicalizeSubTree
     * @inheritDoc
     * @param rootNode
     * @throws CanonicalizationException
     */
    public byte[] engineCanonicalizeSubTree(Node rootNode)
            throws CanonicalizationException {
    		return engineCanonicalizeSubTree(rootNode,(Node)null);
    }
    /**
     * Canonicalizes a Subtree node.
     * @param rootNode the root of the subtree to canicalize
     * @param excludeNode a node to be excluded from the canicalize operation
     * @return The canonicalize stream.
     * @throws CanonicalizationException
     */
     public byte[] engineCanonicalizeSubTree(Node rootNode,Node excludeNode)
     throws CanonicalizationException {
     	this._excludeNode = excludeNode;
         try {
          NameSpaceSymbTable ns=new NameSpaceSymbTable();
          if (rootNode instanceof Element) {
          	//Fills the nssymbtable with the definitions of the parent of the root subnode
          	getParentNameSpaces((Element)rootNode,ns);
          }
          this.canonicalizeSubTree(rootNode,ns);
          this._writer.close();
          if (this._writer instanceof ByteArrayOutputStream) {
             byte []result=((ByteArrayOutputStream)this._writer).toByteArray();
             if (reset) {
                 ((ByteArrayOutputStream)this._writer).reset();
             }
          	return result;
          }
          return null;

       } catch (UnsupportedEncodingException ex) {
          throw new CanonicalizationException("empty", ex);
       } catch (IOException ex) {
          throw new CanonicalizationException("empty", ex);
       }
    }


    /**
     * Method canonicalizeSubTree, this function is a recursive one.
     *
     * @param currentNode
     * @param ns
     * @throws CanonicalizationException
     * @throws IOException
     */
    final void canonicalizeSubTree(Node currentNode, NameSpaceSymbTable ns)
            throws CanonicalizationException, IOException {

       switch (currentNode.getNodeType()) {

       case Node.DOCUMENT_TYPE_NODE :
       default :
          break;

       case Node.ENTITY_NODE :
       case Node.NOTATION_NODE :
       case Node.DOCUMENT_FRAGMENT_NODE :
       case Node.ATTRIBUTE_NODE :
          // illegal node type during traversal
          throw new CanonicalizationException("empty");
       case Node.DOCUMENT_NODE :
          for (Node currentChild = currentNode.getFirstChild();
                  currentChild != null;
                  currentChild = currentChild.getNextSibling()) {
             canonicalizeSubTree(currentChild,ns);
          }
          break;

       case Node.COMMENT_NODE :
          if (this._includeComments) {
             outputCommentToWriter((Comment) currentNode, this._writer);
          }
          break;

       case Node.PROCESSING_INSTRUCTION_NODE :
          outputPItoWriter((ProcessingInstruction) currentNode, this._writer);
          break;

       case Node.TEXT_NODE :
       case Node.CDATA_SECTION_NODE :
          outputTextToWriter(currentNode.getNodeValue(), this._writer);
          break;

       case Node.ELEMENT_NODE :
       	if (currentNode==this._excludeNode) {
       		return;
       	}
         OutputStream writer=this._writer;
          Element currentElement = (Element) currentNode;
          //Add a level to the nssymbtable. So latter can be pop-back.
       	 ns.outputNodePush();
          writer.write('<');
          String tagName=currentElement.getTagName();
          writeStringToUtf8(tagName,writer);

          Iterator attrs = this.handleAttributesSubtree(currentElement,ns);
          if (attrs!=null) {
          	//we output all Attrs which are available
          	while (attrs.hasNext()) {
          		Attr attr = (Attr) attrs.next();
          		outputAttrToWriter(attr.getNodeName(),
                                     attr.getNodeValue(), writer);
          	}
          }

          writer.write('>');

          // traversal
          for (Node currentChild = currentNode.getFirstChild();
                  currentChild != null;
                  currentChild = currentChild.getNextSibling()) {
             canonicalizeSubTree(currentChild,ns);
          }

          writer.write(_END_TAG);
          writeStringToUtf8(tagName,writer);
          writer.write('>');
          //We fineshed with this level, pop to the previous definitions.
          ns.outputNodePop();
          break;
       }
    }

    /**
     * Checks whether a Comment or ProcessingInstruction is before or after the
     * document element. This is needed for prepending or appending "\n"s.
     *
     * @param currentNode comment or pi to check
     * @return NODE_BEFORE_DOCUMENT_ELEMENT, NODE_NOT_BEFORE_OR_AFTER_DOCUMENT_ELEMENT or NODE_AFTER_DOCUMENT_ELEMENT
     * @see #NODE_BEFORE_DOCUMENT_ELEMENT
     * @see #NODE_NOT_BEFORE_OR_AFTER_DOCUMENT_ELEMENT
     * @see #NODE_AFTER_DOCUMENT_ELEMENT
     */
    final static int getPositionRelativeToDocumentElement(Node currentNode) {

       if ((currentNode == null) ||
             (currentNode.getParentNode().getNodeType() != Node.DOCUMENT_NODE) ) {
          return CanonicalizerBase.NODE_NOT_BEFORE_OR_AFTER_DOCUMENT_ELEMENT;
       }
       Element documentElement = currentNode.getOwnerDocument().getDocumentElement();
       if ( (documentElement == null)  || (documentElement == currentNode) ){
          return CanonicalizerBase.NODE_NOT_BEFORE_OR_AFTER_DOCUMENT_ELEMENT;
       }

       for (Node x = currentNode; x != null; x = x.getNextSibling()) {
          if (x == documentElement) {
             return CanonicalizerBase.NODE_BEFORE_DOCUMENT_ELEMENT;
          }
       }

       return CanonicalizerBase.NODE_AFTER_DOCUMENT_ELEMENT;
    }

    /**
     * Method engineCanonicalizeXPathNodeSet
     * @inheritDoc
     * @param xpathNodeSet
     * @throws CanonicalizationException
     */
    public byte[] engineCanonicalizeXPathNodeSet(Set xpathNodeSet)
            throws CanonicalizationException {
       if (xpathNodeSet.size() == 0) {
         return new byte[0];
       }
       this._xpathNodeSet = xpathNodeSet;
       try {
          Node rootNodeOfC14n = XMLUtils.getOwnerDocument(this._xpathNodeSet);
          this.canonicalizeXPathNodeSet(rootNodeOfC14n,new  NameSpaceSymbTable());
          this._writer.close();
          if (this._writer instanceof ByteArrayOutputStream) {
             byte [] sol=((ByteArrayOutputStream)this._writer).toByteArray();
             if (reset) {
             	((ByteArrayOutputStream)this._writer).reset();
             }
          	return sol;
          }
          return null;
       } catch (UnsupportedEncodingException ex) {
          throw new CanonicalizationException("empty", ex);
       } catch (IOException ex) {
          throw new CanonicalizationException("empty", ex);
       }
    }

    /**
     * Canoicalizes all the nodes included in the currentNode and contained in the
 	* _xpathNodeSet field.
     *
     * @param currentNode
 	* @param ns
     * @throws CanonicalizationException
     * @throws IOException
     */
    final void canonicalizeXPathNodeSet(Node currentNode, NameSpaceSymbTable ns )
            throws CanonicalizationException, IOException {
       boolean currentNodeIsVisible = this._xpathNodeSet.contains(currentNode);

       switch (currentNode.getNodeType()) {

       case Node.DOCUMENT_TYPE_NODE :
       default :
          break;

       case Node.ENTITY_NODE :
       case Node.NOTATION_NODE :
       case Node.DOCUMENT_FRAGMENT_NODE :
       case Node.ATTRIBUTE_NODE :
          throw new CanonicalizationException("empty");
       case Node.DOCUMENT_NODE :
          for (Node currentChild = currentNode.getFirstChild();
                  currentChild != null;
                  currentChild = currentChild.getNextSibling()) {
             canonicalizeXPathNodeSet(currentChild,ns);
          }
          break;

       case Node.COMMENT_NODE :
          if (currentNodeIsVisible && this._includeComments) {
             outputCommentToWriter((Comment) currentNode, this._writer);
          }
          break;

       case Node.PROCESSING_INSTRUCTION_NODE :
          if (currentNodeIsVisible) {
             outputPItoWriter((ProcessingInstruction) currentNode, this._writer);
          }
          break;

       case Node.TEXT_NODE :
       case Node.CDATA_SECTION_NODE :
          if (currentNodeIsVisible) {
             outputTextToWriter(currentNode.getNodeValue(), this._writer);

             for (Node nextSibling = currentNode.getNextSibling();
                     (nextSibling != null)
                     && ((nextSibling.getNodeType() == Node.TEXT_NODE)
                         || (nextSibling.getNodeType()
                             == Node.CDATA_SECTION_NODE));
                     nextSibling = nextSibling.getNextSibling()) {
                /* The XPath data model allows to select only the first of a
                 * sequence of mixed text and CDATA nodes. But we must output
                 * them all, so we must search:
                 *
                 * @see http://nagoya.apache.org/bugzilla/show_bug.cgi?id=6329
                 */
                outputTextToWriter(nextSibling.getNodeValue(), this._writer);
             }
          }
          break;

       case Node.ELEMENT_NODE :
          Element currentElement = (Element) currentNode;
       	 OutputStream writer=this._writer;
          String tagName=currentElement.getTagName();
          if (currentNodeIsVisible) {
             //This is an outputNode.
          	ns.outputNodePush();
             writer.write('<');
             writeStringToUtf8(tagName,writer);
          } else {
            //Not an outputNode.
          	ns.push();
          }

          // we output all Attrs which are available
          Iterator attrs = handleAttributes(currentElement,ns);
          while (attrs.hasNext()) {
             Attr attr = (Attr) attrs.next();
             outputAttrToWriter(attr.getNodeName(), attr.getNodeValue(), writer);
          }

          if (currentNodeIsVisible) {
             writer.write('>');
          }

          // traversal
          for (Node currentChild = currentNode.getFirstChild();
                  currentChild != null;
                  currentChild = currentChild.getNextSibling()) {
             canonicalizeXPathNodeSet(currentChild,ns);
          }

          if (currentNodeIsVisible) {
             writer.write(_END_TAG);
             writeStringToUtf8(tagName,writer);
             //this._writer.write(currentElement.getTagName().getBytes("UTF8"));
             writer.write('>');
             ns.outputNodePop();
          } else {
          	ns.pop();
          }
          break;
       }
    }

    	/**
 	 * Adds to ns the definitons from the parent elements of el
    	 * @param el
    	 * @param ns
    	 */
    	final static void getParentNameSpaces(Element el,NameSpaceSymbTable ns)  {
    		List parents=new ArrayList();
    		Node n1=el.getParentNode();
    		if (!(n1 instanceof Element)) {
    			return;
    		}
    		//Obtain all the parents of the elemnt
    		Element parent=(Element) el.getParentNode();
    		while (parent!=null) {
    			parents.add(parent);
    			Node n=parent.getParentNode();
    			if (!(n instanceof Element )) {
    				break;
    			}
    			parent=(Element)n;
    		}
    		//Visit them in reverse order.
    		ListIterator it=parents.listIterator(parents.size());
    		while (it.hasPrevious()) {
    		Element ele=(Element)it.previous();
         if (!ele.hasAttributes()) {
         	continue;
         }
 		NamedNodeMap attrs = ele.getAttributes();
    		int attrsLength = attrs.getLength();
    		 for (int i = 0; i < attrsLength; i++) {
             Attr N = (Attr) attrs.item(i);
             if (!Constants.NamespaceSpecNS.equals(N.getNamespaceURI())) {
                //Not a namespace definition, ignore.
                continue;
             }

             String NName=N.getLocalName();
             String NValue=N.getNodeValue();
             if (XML.equals(NName)
                     && Constants.XML_LANG_SPACE_SpecNS.equals(NValue)) {
                continue;
             }
             ns.addMapping(NName,NValue,N);
    		 }
    		}
         Attr nsprefix;
         if (((nsprefix=ns.getMappingWithoutRendered("xmlns"))!=null)
                 && "".equals(nsprefix.getValue())) {
              ns.addMappingAndRender("xmlns","",nullNode);
         }
    	}
    /**
     * Outputs an Attribute to the internal Writer.
     *
     * The string value of the node is modified by replacing
     * <UL>
     * <LI>all ampersands (&) with <CODE>&amp;amp;</CODE></LI>
     * <LI>all open angle brackets (<) with <CODE>&amp;lt;</CODE></LI>
     * <LI>all quotation mark characters with <CODE>&amp;quot;</CODE></LI>
     * <LI>and the whitespace characters <CODE>#x9</CODE>, #xA, and #xD, with character
     * references. The character references are written in uppercase
     * hexadecimal with no leading zeroes (for example, <CODE>#xD</CODE> is represented
     * by the character reference <CODE>&amp;#xD;</CODE>)</LI>
     * </UL>
     *
     * @param name
     * @param value
     * @param writer
     * @throws IOException
     */
    static final void outputAttrToWriter(final String name, final String value, final OutputStream writer) throws IOException {
       writer.write(' ');
       writeStringToUtf8(name,writer);
       writer.write(equalsStr);
       byte  []toWrite;
       final int length = value.length();
       for (int i=0;i < length; i++) {
          char c = value.charAt(i);

          switch (c) {

          case '&' :
          	toWrite=_AMP_;
             //writer.write(_AMP_);
             break;

          case '<' :
          	toWrite=_LT_;
             //writer.write(_LT_);
             break;

          case '"' :
          	toWrite=_QUOT_;
             //writer.write(_QUOT_);
             break;

          case 0x09 :    // '\t'
          	toWrite=__X9_;
             //writer.write(__X9_);
             break;

          case 0x0A :    // '\n'
          	toWrite=__XA_;
             //writer.write(__XA_);
             break;

          case 0x0D :    // '\r'
          	toWrite=__XD_;
             //writer.write(__XD_);
             break;

          default :
             writeCharToUtf8(c,writer);
             //this._writer.write(c);
             continue;
          }
          writer.write(toWrite);
       }

       writer.write('\"');
    }

    final static void writeCharToUtf8(final char c,final OutputStream out) throws IOException{
    	char ch;
     if (/*(c >= 0x0001) &&*/ (c <= 0x007F)) {
    		out.write(c);
    		return;
    	} else if (c > 0x07FF) {
         ch=(char)(c>>>12);
         if (ch>0) {
         	out.write(0xE0 | ( ch & 0x0F));
         } else {
         	out.write(0xE0);
         }
         out.write(0x80 | ((c >>>  6) & 0x3F));
    		out.write(0x80 | ((c) & 0x3F));
    		return;

    	} else {
         ch=(char)(c>>>6);
         if (ch>0) {
         	out.write(0xC0 | (ch & 0x1F));
         } else {
         	out.write(0xC0);
         }
    		out.write(0x80 | ((c) & 0x3F));
    		return;
    	}

    }

    final static void writeStringToUtf8(final String str,final OutputStream out) throws IOException{
    	final int length=str.length();
    	int i=0;
     char ch,c;
    	while (i<length) {
    		c=str.charAt(i++);
         if (/*(c >= 0x0001) &&*/ (c <= 0x007F)) {
             out.write(c);
             continue;
         } else if (c > 0x07FF) {
             ch=(char)(c>>>12);
             if (ch>0) {
                 out.write(0xE0 | ( ch & 0x0F));
             } else {
                 out.write(0xE0);
             }
             out.write(0x80 | ((c >>>  6) & 0x3F));
             out.write(0x80 | ((c) & 0x3F));
             continue;
         } else {
             ch=(char)(c>>>6);
             if (ch>0) {
                 out.write(0xC0 | (ch & 0x1F));
             } else {
                 out.write(0xC0);
             }
             out.write(0x80 | ((c) & 0x3F));
             continue;
         }
    	}

    }
    /**
     * Outputs a PI to the internal Writer.
     *
     * @param currentPI
     * @param writer TODO
     * @throws IOException
     */
    static final void outputPItoWriter(ProcessingInstruction currentPI, OutputStream writer) throws IOException {
    	  final int position = getPositionRelativeToDocumentElement(currentPI);

       if (position == NODE_AFTER_DOCUMENT_ELEMENT) {
         writer.write('\n');
       }
       writer.write(_BEGIN_PI);

       final String target = currentPI.getTarget();
       int length = target.length();

       for (int i = 0; i < length; i++) {
       	 char c=target.charAt(i);
          if (c==0x0D) {
             writer.write(__XD_);
          } else {
             writeCharToUtf8(c,writer);
          }
       }

       final String data = currentPI.getData();

       length = data.length();

       if (length > 0) {
          writer.write(' ');

          for (int i = 0; i < length; i++) {
          	char c=data.charAt(i);
             if (c==0x0D) {
                writer.write(__XD_);
             } else {
                writeCharToUtf8(c,writer);
             }
          }
       }

       writer.write(_END_PI);
       if (position == NODE_BEFORE_DOCUMENT_ELEMENT) {
         writer.write('\n');
      }
    }

    /**
     * Method outputCommentToWriter
     *
     * @param currentComment
     * @param writer TODO
     * @throws IOException
     */
    static final void outputCommentToWriter(Comment currentComment, OutputStream writer) throws IOException {
    	  final int position = getPositionRelativeToDocumentElement(currentComment);
    	  if (position == NODE_AFTER_DOCUMENT_ELEMENT) {
    		writer.write('\n');
    	  }
       writer.write(_BEGIN_COMM);

       final String data = currentComment.getData();
       final int length = data.length();

       for (int i = 0; i < length; i++) {
          char c=data.charAt(i);
          if (c==0x0D) {
             writer.write(__XD_);
          } else {
             writeCharToUtf8(c,writer);
          }
       }

       writer.write(_END_COMM);
       if (position == NODE_BEFORE_DOCUMENT_ELEMENT) {
 		writer.write('\n');
 	 }
    }

    /**
     * Outputs a Text of CDATA section to the internal Writer.
     *
     * @param text
     * @param writer TODO
     * @throws IOException
     */
    static final void outputTextToWriter(final String text, final OutputStream writer) throws IOException {
       final int length = text.length();
       byte []toWrite;
       for (int i = 0; i < length; i++) {
          char c = text.charAt(i);

          switch (c) {

          case '&' :
          	toWrite=_AMP_;
             //writer.write(_AMP_);
             break;

          case '<' :
          	toWrite=_LT_;
             //writer.write(_LT_);
             break;

          case '>' :
          	toWrite=_GT_;
             //writer.write(_GT_);
             break;

          case 0xD :
          	toWrite=__XD_;
             //writer.write(__XD_);
             break;

          default :
             writeCharToUtf8(c,writer);
             continue;
          }
          writer.write(toWrite);
       }
    }

    /**
     * Obtain the attributes to output for this node in XPathNodeSet c14n.
     *
     * @param E
 	* @param ns
 	* @return the attributes nodes to output.
     * @throws CanonicalizationException
     */
    abstract Iterator handleAttributes(Element E, NameSpaceSymbTable ns )
    throws CanonicalizationException;

    /**
     * Obtain the attributes to output for this node in a Subtree c14n.
     *
     * @param E
 	* @param ns
 	* @return the attributes nodes to output.
     * @throws CanonicalizationException
     */
    abstract Iterator handleAttributesSubtree(Element E, NameSpaceSymbTable ns)
    throws CanonicalizationException;


    /**
     * @return Returns the _includeComments.
     */
    final public boolean is_includeComments() {
 	 return _includeComments;
    }
    /**
     * @param comments The _includeComments to set.
     */
     final public void set_includeComments(boolean comments) {
 	    _includeComments = comments;
     }

     /**
      * @param _writer The _writer to set.
      */
     public void setWriter(OutputStream _writer) {
     	this._writer = _writer;
     }

 }
	/*
	* Copyright 1999-2004 The Apache Software Foundation.
	*
	* Licensed under the Apache License, Version 2.0 (the "License");
	* you may not use this file except in compliance with the License.
	* You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*
	*/
	package org.apache.xml.security.c14n.implementations;



	import java.io.ByteArrayOutputStream;
	import java.io.IOException;
	import java.io.OutputStream;
	import java.io.UnsupportedEncodingException;
	import java.util.ArrayList;
	import java.util.Iterator;
	import java.util.List;
	import java.util.ListIterator;
	import java.util.Set;

	import javax.xml.parsers.DocumentBuilderFactory;

	import org.apache.xml.security.c14n.CanonicalizationException;
	import org.apache.xml.security.c14n.CanonicalizerSpi;
	import org.apache.xml.security.c14n.helper.AttrCompare;
	import org.apache.xml.security.utils.Constants;
	import org.apache.xml.security.utils.XMLUtils;
	import org.w3c.dom.Attr;
	import org.w3c.dom.Comment;
	import org.w3c.dom.Element;
	import org.w3c.dom.NamedNodeMap;
	import org.w3c.dom.Node;
	import org.w3c.dom.ProcessingInstruction;


	/**
	* Abstract base class for canonicalization algorithms.
	*
	* @author Christian Geuer-Pollmann <geuerp@apache.org>
	* @version $Revision$
	*/
	public abstract class CanonicalizerBase extends CanonicalizerSpi {
	//Constants to be outputed, In char array form, so
	//less garbage is generate when outputed.
	private static final byte[] _END_PI = {'?','>'};
	private static final byte[] _BEGIN_PI = {'<','?'};
	private static final byte[] _END_COMM = {'-','-','>'};
	private static final byte[] _BEGIN_COMM = {'<','!','-','-'};
	private static final byte[] __XA_ = {'&','#','x','A',';'};
	private static final byte[] __X9_ = {'&','#','x','9',';'};
	private static final byte[] _QUOT_ = {'&','q','u','o','t',';'};
	private static final byte[] __XD_ = {'&','#','x','D',';'};
	private static final byte[] _GT_ = {'&','g','t',';'};
	private static final byte[] _LT_ = {'&','l','t',';'};
	private static final byte[] _END_TAG = {'<','/'};
	private static final byte[] _AMP_ = {'&','a','m','p',';'};
	final static AttrCompare COMPARE=new AttrCompare();
	final static String XML="xml";
	final static String XMLNS="xmlns";
	final static byte[] equalsStr= {'=','\"'};
	static final int NODE_BEFORE_DOCUMENT_ELEMENT = -1;
	static final int NODE_NOT_BEFORE_OR_AFTER_DOCUMENT_ELEMENT = 0;
	static final int NODE_AFTER_DOCUMENT_ELEMENT = 1;
	//The null xmlns definiton.
	protected static final Attr nullNode;
	static {
	try {
	nullNode=DocumentBuilderFactory.newInstance().
	newDocumentBuilder().newDocument().createAttributeNS(Constants.NamespaceSpecNS,XMLNS);
	nullNode.setValue("");
	} catch (Exception e) {
	throw new RuntimeException("Unable to create nullNode"/,/+e);
	}
	}

	boolean _includeComments;
	Set _xpathNodeSet = null;
	/**
	* The node to be skiped/excluded from the DOM tree
	* in subtree canonicalizations.
	*/
	Node _excludeNode =null;
	OutputStream _writer = new ByteArrayOutputStream();//null;

	/**
	* Constructor CanonicalizerBase
	*
	* @param includeComments
	*/
	public CanonicalizerBase(boolean includeComments) {
	this._includeComments = includeComments;
	}

	/**
	* Method engineCanonicalizeSubTree
	* @inheritDoc
	* @param rootNode
	* @throws CanonicalizationException
	*/
	public byte[] engineCanonicalizeSubTree(Node rootNode)
	throws CanonicalizationException {
	return engineCanonicalizeSubTree(rootNode,(Node)null);
	}
	/**
	* Canonicalizes a Subtree node.
	* @param rootNode the root of the subtree to canicalize
	* @param excludeNode a node to be excluded from the canicalize operation
	* @return The canonicalize stream.
	* @throws CanonicalizationException
	*/
	public byte[] engineCanonicalizeSubTree(Node rootNode,Node excludeNode)
	throws CanonicalizationException {
	this._excludeNode = excludeNode;
	try {
	NameSpaceSymbTable ns=new NameSpaceSymbTable();
	if (rootNode instanceof Element) {
	//Fills the nssymbtable with the definitions of the parent of the root subnode
	getParentNameSpaces((Element)rootNode,ns);
	}
	this.canonicalizeSubTree(rootNode,ns);
	this._writer.close();
	if (this._writer instanceof ByteArrayOutputStream) {
	byte []result=((ByteArrayOutputStream)this._writer).toByteArray();
	if (reset) {
	((ByteArrayOutputStream)this._writer).reset();
	}
	return result;
	}
	return null;

	} catch (UnsupportedEncodingException ex) {
	throw new CanonicalizationException("empty", ex);
	} catch (IOException ex) {
	throw new CanonicalizationException("empty", ex);
	}
	}


	/**
	* Method canonicalizeSubTree, this function is a recursive one.
	*
	* @param currentNode
	* @param ns
	* @throws CanonicalizationException
	* @throws IOException
	*/
	final void canonicalizeSubTree(Node currentNode, NameSpaceSymbTable ns)
	throws CanonicalizationException, IOException {

	switch (currentNode.getNodeType()) {

	case Node.DOCUMENT_TYPE_NODE :
	default :
	break;

	case Node.ENTITY_NODE :
	case Node.NOTATION_NODE :
	case Node.DOCUMENT_FRAGMENT_NODE :
	case Node.ATTRIBUTE_NODE :
	// illegal node type during traversal
	throw new CanonicalizationException("empty");
	case Node.DOCUMENT_NODE :
	for (Node currentChild = currentNode.getFirstChild();
	currentChild != null;
	currentChild = currentChild.getNextSibling()) {
	canonicalizeSubTree(currentChild,ns);
	}
	break;

	case Node.COMMENT_NODE :
	if (this._includeComments) {
	outputCommentToWriter((Comment) currentNode, this._writer);
	}
	break;

	case Node.PROCESSING_INSTRUCTION_NODE :
	outputPItoWriter((ProcessingInstruction) currentNode, this._writer);
	break;

	case Node.TEXT_NODE :
	case Node.CDATA_SECTION_NODE :
	outputTextToWriter(currentNode.getNodeValue(), this._writer);
	break;

	case Node.ELEMENT_NODE :
	if (currentNode==this._excludeNode) {
	return;
	}
	OutputStream writer=this._writer;
	Element currentElement = (Element) currentNode;
	//Add a level to the nssymbtable. So latter can be pop-back.
	ns.outputNodePush();
	writer.write('<');
	String tagName=currentElement.getTagName();
	writeStringToUtf8(tagName,writer);

	Iterator attrs = this.handleAttributesSubtree(currentElement,ns);
	if (attrs!=null) {
	//we output all Attrs which are available
	while (attrs.hasNext()) {
	Attr attr = (Attr) attrs.next();
	outputAttrToWriter(attr.getNodeName(),
	attr.getNodeValue(), writer);
	}
	}

	writer.write('>');

	// traversal
	for (Node currentChild = currentNode.getFirstChild();
	currentChild != null;
	currentChild = currentChild.getNextSibling()) {
	canonicalizeSubTree(currentChild,ns);
	}

	writer.write(_END_TAG);
	writeStringToUtf8(tagName,writer);
	writer.write('>');
	//We fineshed with this level, pop to the previous definitions.
	ns.outputNodePop();
	break;
	}
	}

	/**
	* Checks whether a Comment or ProcessingInstruction is before or after the
	* document element. This is needed for prepending or appending "\n"s.
	*
	* @param currentNode comment or pi to check
	* @return NODE_BEFORE_DOCUMENT_ELEMENT, NODE_NOT_BEFORE_OR_AFTER_DOCUMENT_ELEMENT or NODE_AFTER_DOCUMENT_ELEMENT
	* @see #NODE_BEFORE_DOCUMENT_ELEMENT
	* @see #NODE_NOT_BEFORE_OR_AFTER_DOCUMENT_ELEMENT
	* @see #NODE_AFTER_DOCUMENT_ELEMENT
	*/
	final static int getPositionRelativeToDocumentElement(Node currentNode) {

	if ((currentNode == null) \|\|
	(currentNode.getParentNode().getNodeType() != Node.DOCUMENT_NODE) ) {
	return CanonicalizerBase.NODE_NOT_BEFORE_OR_AFTER_DOCUMENT_ELEMENT;
	}
	Element documentElement = currentNode.getOwnerDocument().getDocumentElement();
	if ( (documentElement == null) \|\| (documentElement == currentNode) ){
	return CanonicalizerBase.NODE_NOT_BEFORE_OR_AFTER_DOCUMENT_ELEMENT;
	}

	for (Node x = currentNode; x != null; x = x.getNextSibling()) {
	if (x == documentElement) {
	return CanonicalizerBase.NODE_BEFORE_DOCUMENT_ELEMENT;
	}
	}

	return CanonicalizerBase.NODE_AFTER_DOCUMENT_ELEMENT;
	}

	/**
	* Method engineCanonicalizeXPathNodeSet
	* @inheritDoc
	* @param xpathNodeSet
	* @throws CanonicalizationException
	*/
	public byte[] engineCanonicalizeXPathNodeSet(Set xpathNodeSet)
	throws CanonicalizationException {
	if (xpathNodeSet.size() == 0) {
	return new byte[0];
	}
	this._xpathNodeSet = xpathNodeSet;
	try {
	Node rootNodeOfC14n = XMLUtils.getOwnerDocument(this._xpathNodeSet);
	this.canonicalizeXPathNodeSet(rootNodeOfC14n,new NameSpaceSymbTable());
	this._writer.close();
	if (this._writer instanceof ByteArrayOutputStream) {
	byte [] sol=((ByteArrayOutputStream)this._writer).toByteArray();
	if (reset) {
	((ByteArrayOutputStream)this._writer).reset();
	}
	return sol;
	}
	return null;
	} catch (UnsupportedEncodingException ex) {
	throw new CanonicalizationException("empty", ex);
	} catch (IOException ex) {
	throw new CanonicalizationException("empty", ex);
	}
	}

	/**
	* Canoicalizes all the nodes included in the currentNode and contained in the
	* _xpathNodeSet field.
	*
	* @param currentNode
	* @param ns
	* @throws CanonicalizationException
	* @throws IOException
	*/
	final void canonicalizeXPathNodeSet(Node currentNode, NameSpaceSymbTable ns )
	throws CanonicalizationException, IOException {
	boolean currentNodeIsVisible = this._xpathNodeSet.contains(currentNode);

	switch (currentNode.getNodeType()) {

	case Node.DOCUMENT_TYPE_NODE :
	default :
	break;

	case Node.ENTITY_NODE :
	case Node.NOTATION_NODE :
	case Node.DOCUMENT_FRAGMENT_NODE :
	case Node.ATTRIBUTE_NODE :
	throw new CanonicalizationException("empty");
	case Node.DOCUMENT_NODE :
	for (Node currentChild = currentNode.getFirstChild();
	currentChild != null;
	currentChild = currentChild.getNextSibling()) {
	canonicalizeXPathNodeSet(currentChild,ns);
	}
	break;

	case Node.COMMENT_NODE :
	if (currentNodeIsVisible && this._includeComments) {
	outputCommentToWriter((Comment) currentNode, this._writer);
	}
	break;

	case Node.PROCESSING_INSTRUCTION_NODE :
	if (currentNodeIsVisible) {
	outputPItoWriter((ProcessingInstruction) currentNode, this._writer);
	}
	break;

	case Node.TEXT_NODE :
	case Node.CDATA_SECTION_NODE :
	if (currentNodeIsVisible) {
	outputTextToWriter(currentNode.getNodeValue(), this._writer);

	for (Node nextSibling = currentNode.getNextSibling();
	(nextSibling != null)
	&& ((nextSibling.getNodeType() == Node.TEXT_NODE)
	\|\| (nextSibling.getNodeType()
	== Node.CDATA_SECTION_NODE));
	nextSibling = nextSibling.getNextSibling()) {
	/* The XPath data model allows to select only the first of a
	* sequence of mixed text and CDATA nodes. But we must output
	* them all, so we must search:
	*
	* @see http://nagoya.apache.org/bugzilla/show_bug.cgi?id=6329
	*/
	outputTextToWriter(nextSibling.getNodeValue(), this._writer);
	}
	}
	break;

	case Node.ELEMENT_NODE :
	Element currentElement = (Element) currentNode;
	OutputStream writer=this._writer;
	String tagName=currentElement.getTagName();
	if (currentNodeIsVisible) {
	//This is an outputNode.
	ns.outputNodePush();
	writer.write('<');
	writeStringToUtf8(tagName,writer);
	} else {
	//Not an outputNode.
	ns.push();
	}

	// we output all Attrs which are available
	Iterator attrs = handleAttributes(currentElement,ns);
	while (attrs.hasNext()) {
	Attr attr = (Attr) attrs.next();
	outputAttrToWriter(attr.getNodeName(), attr.getNodeValue(), writer);
	}

	if (currentNodeIsVisible) {
	writer.write('>');
	}

	// traversal
	for (Node currentChild = currentNode.getFirstChild();
	currentChild != null;
	currentChild = currentChild.getNextSibling()) {
	canonicalizeXPathNodeSet(currentChild,ns);
	}

	if (currentNodeIsVisible) {
	writer.write(_END_TAG);
	writeStringToUtf8(tagName,writer);
	//this._writer.write(currentElement.getTagName().getBytes("UTF8"));
	writer.write('>');
	ns.outputNodePop();
	} else {
	ns.pop();
	}
	break;
	}
	}

	/**
	* Adds to ns the definitons from the parent elements of el
	* @param el
	* @param ns
	*/
	final static void getParentNameSpaces(Element el,NameSpaceSymbTable ns) {
	List parents=new ArrayList();
	Node n1=el.getParentNode();
	if (!(n1 instanceof Element)) {
	return;
	}
	//Obtain all the parents of the elemnt
	Element parent=(Element) el.getParentNode();
	while (parent!=null) {
	parents.add(parent);
	Node n=parent.getParentNode();
	if (!(n instanceof Element )) {
	break;
	}
	parent=(Element)n;
	}
	//Visit them in reverse order.
	ListIterator it=parents.listIterator(parents.size());
	while (it.hasPrevious()) {
	Element ele=(Element)it.previous();
	if (!ele.hasAttributes()) {
	continue;
	}
	NamedNodeMap attrs = ele.getAttributes();
	int attrsLength = attrs.getLength();
	for (int i = 0; i < attrsLength; i++) {
	Attr N = (Attr) attrs.item(i);
	if (!Constants.NamespaceSpecNS.equals(N.getNamespaceURI())) {
	//Not a namespace definition, ignore.
	continue;
	}

	String NName=N.getLocalName();
	String NValue=N.getNodeValue();
	if (XML.equals(NName)
	&& Constants.XML_LANG_SPACE_SpecNS.equals(NValue)) {
	continue;
	}
	ns.addMapping(NName,NValue,N);
	}
	}
	Attr nsprefix;
	if (((nsprefix=ns.getMappingWithoutRendered("xmlns"))!=null)
	&& "".equals(nsprefix.getValue())) {
	ns.addMappingAndRender("xmlns","",nullNode);
	}
	}
	/**
	* Outputs an Attribute to the internal Writer.
	*
	* The string value of the node is modified by replacing
	* <UL>
	* <LI>all ampersands (&) with <CODE>&amp;</CODE></LI>
	* <LI>all open angle brackets (<) with <CODE>&lt;</CODE></LI>
	* <LI>all quotation mark characters with <CODE>&quot;</CODE></LI>
	* <LI>and the whitespace characters <CODE>#x9</CODE>, #xA, and #xD, with character
	* references. The character references are written in uppercase
	* hexadecimal with no leading zeroes (for example, <CODE>#xD</CODE> is represented
	* by the character reference <CODE>&#xD;</CODE>)</LI>
	* </UL>
	*
	* @param name
	* @param value
	* @param writer
	* @throws IOException
	*/
	static final void outputAttrToWriter(final String name, final String value, final OutputStream writer) throws IOException {
	writer.write(' ');
	writeStringToUtf8(name,writer);
	writer.write(equalsStr);
	byte []toWrite;
	final int length = value.length();
	for (int i=0;i < length; i++) {
	char c = value.charAt(i);

	switch (c) {

	case '&' :
	toWrite=_AMP_;
	//writer.write(_AMP_);
	break;

	case '<' :
	toWrite=_LT_;
	//writer.write(_LT_);
	break;

	case '"' :
	toWrite=_QUOT_;
	//writer.write(_QUOT_);
	break;

	case 0x09 : // '\t'
	toWrite=__X9_;
	//writer.write(__X9_);
	break;

	case 0x0A : // '\n'
	toWrite=__XA_;
	//writer.write(__XA_);
	break;

	case 0x0D : // '\r'
	toWrite=__XD_;
	//writer.write(__XD_);
	break;

	default :
	writeCharToUtf8(c,writer);
	//this._writer.write(c);
	continue;
	}
	writer.write(toWrite);
	}

	writer.write('\"');
	}

	final static void writeCharToUtf8(final char c,final OutputStream out) throws IOException{
	char ch;
	if (/(c >= 0x0001) &&/ (c <= 0x007F)) {
	out.write(c);
	return;
	} else if (c > 0x07FF) {
	ch=(char)(c>>>12);
	if (ch>0) {
	out.write(0xE0 \| ( ch & 0x0F));
	} else {
	out.write(0xE0);
	}
	out.write(0x80 \| ((c >>> 6) & 0x3F));
	out.write(0x80 \| ((c) & 0x3F));
	return;

	} else {
	ch=(char)(c>>>6);
	if (ch>0) {
	out.write(0xC0 \| (ch & 0x1F));
	} else {
	out.write(0xC0);
	}
	out.write(0x80 \| ((c) & 0x3F));
	return;
	}

	}

	final static void writeStringToUtf8(final String str,final OutputStream out) throws IOException{
	final int length=str.length();
	int i=0;
	char ch,c;
	while (i<length) {
	c=str.charAt(i++);
	if (/(c >= 0x0001) &&/ (c <= 0x007F)) {
	out.write(c);
	continue;
	} else if (c > 0x07FF) {
	ch=(char)(c>>>12);
	if (ch>0) {
	out.write(0xE0 \| ( ch & 0x0F));
	} else {
	out.write(0xE0);
	}
	out.write(0x80 \| ((c >>> 6) & 0x3F));
	out.write(0x80 \| ((c) & 0x3F));
	continue;
	} else {
	ch=(char)(c>>>6);
	if (ch>0) {
	out.write(0xC0 \| (ch & 0x1F));
	} else {
	out.write(0xC0);
	}
	out.write(0x80 \| ((c) & 0x3F));
	continue;
	}
	}

	}
	/**
	* Outputs a PI to the internal Writer.
	*
	* @param currentPI
	* @param writer TODO
	* @throws IOException
	*/
	static final void outputPItoWriter(ProcessingInstruction currentPI, OutputStream writer) throws IOException {
	final int position = getPositionRelativeToDocumentElement(currentPI);

	if (position == NODE_AFTER_DOCUMENT_ELEMENT) {
	writer.write('\n');
	}
	writer.write(_BEGIN_PI);

	final String target = currentPI.getTarget();
	int length = target.length();

	for (int i = 0; i < length; i++) {
	char c=target.charAt(i);
	if (c==0x0D) {
	writer.write(__XD_);
	} else {
	writeCharToUtf8(c,writer);
	}
	}

	final String data = currentPI.getData();

	length = data.length();

	if (length > 0) {
	writer.write(' ');

	for (int i = 0; i < length; i++) {
	char c=data.charAt(i);
	if (c==0x0D) {
	writer.write(__XD_);
	} else {
	writeCharToUtf8(c,writer);
	}
	}
	}

	writer.write(_END_PI);
	if (position == NODE_BEFORE_DOCUMENT_ELEMENT) {
	writer.write('\n');
	}
	}

	/**
	* Method outputCommentToWriter
	*
	* @param currentComment
	* @param writer TODO
	* @throws IOException
	*/
	static final void outputCommentToWriter(Comment currentComment, OutputStream writer) throws IOException {
	final int position = getPositionRelativeToDocumentElement(currentComment);
	if (position == NODE_AFTER_DOCUMENT_ELEMENT) {
	writer.write('\n');
	}
	writer.write(_BEGIN_COMM);

	final String data = currentComment.getData();
	final int length = data.length();

	for (int i = 0; i < length; i++) {
	char c=data.charAt(i);
	if (c==0x0D) {
	writer.write(__XD_);
	} else {
	writeCharToUtf8(c,writer);
	}
	}

	writer.write(_END_COMM);
	if (position == NODE_BEFORE_DOCUMENT_ELEMENT) {
	writer.write('\n');
	}
	}

	/**
	* Outputs a Text of CDATA section to the internal Writer.
	*
	* @param text
	* @param writer TODO
	* @throws IOException
	*/
	static final void outputTextToWriter(final String text, final OutputStream writer) throws IOException {
	final int length = text.length();
	byte []toWrite;
	for (int i = 0; i < length; i++) {
	char c = text.charAt(i);

	switch (c) {

	case '&' :
	toWrite=_AMP_;
	//writer.write(_AMP_);
	break;

	case '<' :
	toWrite=_LT_;
	//writer.write(_LT_);
	break;

	case '>' :
	toWrite=_GT_;
	//writer.write(_GT_);
	break;

	case 0xD :
	toWrite=__XD_;
	//writer.write(__XD_);
	break;

	default :
	writeCharToUtf8(c,writer);
	continue;
	}
	writer.write(toWrite);
	}
	}

	/**
	* Obtain the attributes to output for this node in XPathNodeSet c14n.
	*
	* @param E
	* @param ns
	* @return the attributes nodes to output.
	* @throws CanonicalizationException
	*/
	abstract Iterator handleAttributes(Element E, NameSpaceSymbTable ns )
	throws CanonicalizationException;

	/**
	* Obtain the attributes to output for this node in a Subtree c14n.
	*
	* @param E
	* @param ns
	* @return the attributes nodes to output.
	* @throws CanonicalizationException
	*/
	abstract Iterator handleAttributesSubtree(Element E, NameSpaceSymbTable ns)
	throws CanonicalizationException;


	/**
	* @return Returns the _includeComments.
	*/
	final public boolean is_includeComments() {
	return _includeComments;
	}
	/**
	* @param comments The _includeComments to set.
	*/
	final public void set_includeComments(boolean comments) {
	_includeComments = comments;
	}

	/**
	* @param _writer The _writer to set.
	*/
	public void setWriter(OutputStream _writer) {
	this._writer = _writer;
	}

	}