src/xercesc/dom/impl/DOMWriterImpl.cpp - xerces-c - Git at Google

 /*
  * The Apache Software License, Version 1.1
  *
  * Copyright (c) 2002 The Apache Software Foundation.  All rights
  * reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  *
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  *
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in
  *    the documentation and/or other materials provided with the
  *    distribution.
  *
  * 3. The end-user documentation included with the redistribution,
  *    if any, must include the following acknowledgment:
  *       "This product includes software developed by the
  *        Apache Software Foundation (http://www.apache.org/)."
  *    Alternately, this acknowledgment may appear in the software itself,
  *    if and wherever such third-party acknowledgments normally appear.
  *
  * 4. The names "Xerces" and "Apache Software Foundation" must
  *    not be used to endorse or promote products derived from this
  *    software without prior written permission. For written
  *    permission, please contact apache\@apache.org.
  *
  * 5. Products derived from this software may not be called "Apache",
  *    nor may "Apache" appear in their featName, without prior written
  *    permission of the Apache Software Foundation.
  *
  * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
  * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
  * DISCLAIMED.  IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
  * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
  * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
  * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  * ====================================================================
  *
  * This software consists of voluntary contributions made by many
  * individuals on behalf of the Apache Software Foundation, and was
  * originally based on software copyright (c) 1999, International
  * Business Machines, Inc., http://www.ibm.com .  For more information
  * on the Apache Software Foundation, please see
  * <http://www.apache.org/>.
  */

 /*
  * $Id$
  * $Log$
  * Revision 1.14  2002/07/22 23:24:01  tng
  * DOM L3: writeToString should use the fFormatter to do the transcoding
  *
  * Revision 1.13  2002/07/16 15:19:42  peiyongz
  * check lenght of getEncoding()/getActualEncoding()
  *
  * Revision 1.12  2002/06/25 16:17:16  tng
  * DOM L3: add release()
  *
  * Revision 1.11  2002/06/21 19:33:12  peiyongz
  * support for feature split_cdata_section and entities revised.
  *
  * Revision 1.10  2002/06/18 15:35:25  peiyongz
  * Bug#9950: Compilation error on MSVC5, patch from PeterV@ti.com.od.ua (Peter A. Volchek)
  *
  * Revision 1.9  2002/06/17 19:45:58  peiyongz
  * optimization on fFeatures and featureId introduced
  *
  * Revision 1.8  2002/06/11 19:45:45  peiyongz
  * Notify application of the XMLFormatter creation failure
  *
  * Revision 1.7  2002/06/10 16:02:21  peiyongz
  * format-pretty-print partially supported
  * resolve encoding from DOMDocument Interface
  *
  * Revision 1.6  2002/06/06 20:58:37  tng
  * [Bug 9639] enum_mem in DOMError clashes with constant.
  *
  * Revision 1.5  2002/06/05 16:03:03  peiyongz
  * delete[] used.
  *
  * Revision 1.4  2002/06/03 22:35:54  peiyongz
  * constants changed
  *
  * Revision 1.3  2002/05/31 21:01:06  peiyongz
  * move printing of XMLDecl into the processNode().
  *
  * Revision 1.2  2002/05/29 21:31:50  knoaman
  * DOM L3 LS: DOMInputSource, DOMEntityResolver, DOMImplementationLS and DOMBuilder
  *
  * Revision 1.1  2002/05/28 22:39:39  peiyongz
  * DOM3 Save Interface: DOMWriter/DOMWriterFilter
  *
  */

 #include "DOMWriterImpl.hpp"
 #include "DOMErrorImpl.hpp"
 #include "DOMLocatorImpl.hpp"

 #include <xercesc/framework/MemBufFormatTarget.hpp>

 #include <xercesc/util/TransService.hpp>
 #include <xercesc/util/TranscodingException.hpp>
 #include <xercesc/util/Janitor.hpp>
 #include <xercesc/util/XMLString.hpp>
 #include <xercesc/util/XMLUniDefs.hpp>

 // ---------------------------------------------------------------------------
 //  Local const data
 //
 // ---------------------------------------------------------------------------

 static const int INVALID_FEATURE_ID               = -1;
 static const int CANONICAL_FORM_ID                = 0x0;
 static const int DISCARD_DEFAULT_CONTENT_ID       = 0x1;
 static const int ENTITIES_ID                      = 0x2;
 static const int FORMAT_PRETTY_PRINT_ID           = 0x3;
 static const int NORMALIZE_CHARACTERS_ID          = 0x4;
 static const int SPLIT_CDATA_SECTIONS_ID          = 0x5;
 static const int VALIDATION_ID                    = 0x6;
 static const int WHITESPACE_IN_ELEMENT_CONTENT_ID = 0x7;

 //    feature                      true                       false
 // ================================================================================
 //canonical-form                 [optional] Not Supported     [required] (default)
 //discard-default-content        [required] (default)         [required]
 //entity                         [required] (default)         [optional]
 //format-pretty-print            [optional] Partially Supported [required] (default)
 //normalize-characters           [optional] Not Supported     [required] (default)
 //split-cdata-sections           [required] (default)         [required]
 //validation                     [optional] Not Supported     [required] (default)
 //whitespace-in-element-content  [requierd] (default)         [optional] Not Supported
 //

 //
 // Each feature has 2 entries in this array,
 // the first for "true",
 // the second for "false".
 //
 static bool  featuresSupported[] = {
     false, true,  // canonical-form
     true,  true,  // discard-default-content
     true,  true,  // entity
     true,  true,  // format-pretty-print
     false, true,  // normalize-characters
     true,  true,  // split-cdata-sections
     false, true,  // validation
     true,  false  // whitespace-in-element-content
 };

 // default end-of-line sequence
 static const XMLCh  gEOLSeq[] =
 {
 	chLF, chNull
 };

 //UTF-8
 static const XMLCh  gUTF8[] =
 {
 	chLatin_U, chLatin_T, chLatin_F, chDash, chDigit_8, chNull
 };

 //</
 static const XMLCh  gEndElement[] =
 {
 	chOpenAngle, chForwardSlash, chNull
 };

 //?>
 static const XMLCh  gEndPI[] =
 {
 	chQuestion, chCloseAngle, chNull
 };

 //<?
 static const XMLCh  gStartPI[] =
 {
 	chOpenAngle, chQuestion, chNull
 };

 //<?xml version="
 static const XMLCh  gXMLDecl_VersionInfo[] =
 {
 	chOpenAngle, chQuestion, chLatin_x,     chLatin_m,  chLatin_l,  chSpace,
 	chLatin_v,   chLatin_e,  chLatin_r,     chLatin_s,  chLatin_i,  chLatin_o,
 	chLatin_n,   chEqual,    chDoubleQuote, chNull
 };

 static const XMLCh gXMLDecl_ver10[] =
 {
     chDigit_1, chPeriod, chDigit_0, chNull
 };

 //encoding="
 static const XMLCh  gXMLDecl_EncodingDecl[] =
 {
 	chLatin_e,  chLatin_n,  chLatin_c,  chLatin_o,      chLatin_d, chLatin_i,
     chLatin_n,  chLatin_g,  chEqual,    chDoubleQuote,  chNull
 };

 //" standalone="
 static const XMLCh  gXMLDecl_SDDecl[] =
 {
 	chLatin_s, chLatin_t, chLatin_a,   chLatin_n,    chLatin_d,   chLatin_a,
     chLatin_l, chLatin_o, chLatin_n,   chLatin_e,    chEqual,     chDoubleQuote,
     chNull
 };

 //"
 static const XMLCh  gXMLDecl_separator[] =
 {
 	chDoubleQuote, chSpace, chNull
 };

 //?>
 static const XMLCh  gXMLDecl_endtag[] =
 {
 	chQuestion, chCloseAngle,  chNull
 };

 //<![CDATA[
 static const XMLCh  gStartCDATA[] =
 {
 	chOpenAngle, chBang,    chOpenSquare, chLatin_C, chLatin_D,
     chLatin_A,   chLatin_T, chLatin_A,    chOpenSquare, chNull
 };

 //]]>
 static const XMLCh  gEndCDATA[] =
 {
     chCloseSquare, chCloseAngle, chCloseAngle, chNull  // test only: ]>>
 //  chCloseSquare, chCloseSquare, chCloseAngle, chNull
 };

 //<!--
 static const XMLCh  gStartComment[] =
 {
     chOpenAngle, chBang, chDash, chDash, chNull
 };

 //-->
 static const XMLCh  gEndComment[] =
 {
     chDash, chDash, chCloseAngle, chNull
 };

 //<!DOCTYPE
 static const XMLCh  gStartDoctype[] =
 {
     chOpenAngle, chBang,    chLatin_D, chLatin_O, chLatin_C, chLatin_T,
     chLatin_Y,   chLatin_P, chLatin_E, chSpace,   chNull
 };

 //PUBLIC "
 static const XMLCh  gPublic[] =
 {
     chLatin_P, chLatin_U, chLatin_B,     chLatin_L, chLatin_I,
     chLatin_C, chSpace,   chDoubleQuote, chNull
 };

 //SYSTEM "
 static const XMLCh  gSystem[] =
 {
     chLatin_S, chLatin_Y, chLatin_S,     chLatin_T, chLatin_E,
     chLatin_M, chSpace,   chDoubleQuote, chNull
 };

 //<!ENTITY
 static const XMLCh  gStartEntity[] =
 {
     chOpenAngle, chBang,    chLatin_E, chLatin_N, chLatin_T, chLatin_I,
     chLatin_T,   chLatin_Y, chSpace,   chNull
 };

 //NDATA "
 static const XMLCh  gNotation[] =
 {
     chLatin_N, chLatin_D,     chLatin_A, chLatin_T, chLatin_A,
     chSpace,   chDoubleQuote, chNull
 };

 // Unrecognized node type
 static const XMLCh  gUnrecognizedNodeType[] =
 {
 	chLatin_U, chLatin_n, chLatin_r, chLatin_e, chLatin_c, chLatin_o,
     chLatin_g, chLatin_n, chLatin_i, chLatin_z, chLatin_e, chLatin_d,
 	chSpace,   chLatin_N, chLatin_o, chLatin_d, chLatin_e, chSpace,
 	chLatin_T, chLatin_y, chLatin_p, chLatin_e, chNull
 };

 // nested cdata
 static const XMLCh  gNestedCdata[] =
 {
 	chLatin_N, chLatin_e, chLatin_s, chLatin_t, chLatin_e, chLatin_d,
     chLatin_C, chLatin_D, chLatin_a, chLatin_t, chLatin_a, chNull
 };

 // Unrepresentable char
 static const XMLCh  gUnrepresentableChar[] =
 {
 	chLatin_U, chLatin_n, chLatin_r, chLatin_e, chLatin_p, chLatin_r,
     chLatin_e, chLatin_s, chLatin_e, chLatin_n, chLatin_t, chLatin_a,
 	chLatin_b, chLatin_l, chLatin_e, chSpace,   chLatin_C, chLatin_h,
 	chLatin_a, chLatin_r, chNull
 };

 //Feature
 static const XMLCh  gFeature[] =
 {
 	chLatin_F, chLatin_e, chLatin_a, chLatin_t, chLatin_u, chLatin_r,
     chLatin_e, chSpace,   chNull
 };

 // Can not be set to
 static const XMLCh  gCantSet[] =
 {
 	chSpace,   chLatin_C, chLatin_a, chLatin_n, chSpace, chLatin_n, chLatin_o,
     chLatin_t, chSpace,   chLatin_b, chLatin_e, chSpace, chLatin_s,
     chLatin_e, chLatin_t, chSpace,   chLatin_t, chLatin_o, chSpace, chNull
 };

 static const XMLCh  gTrue[] =
 {
 	chSingleQuote, chLatin_t, chLatin_r, chLatin_u, chLatin_e,
     chSingleQuote, chLF,      chNull
 };

 static const XMLCh  gFalse[] =
 {
 	chSingleQuote, chLatin_f, chLatin_a, chLatin_l, chLatin_s,
     chLatin_e,     chSingleQuote, chLF, chNull
 };

 //
 // Notification of the error though error handler
 //
 // The application may instruct the engine to abort serialization
 // by returning "false".
 //
 // REVISIT: update the locator ctor once the line#, col#, uri and offset
 // are available from DOM3 core
 //
 // REVISIT: use throwing exception to abort serialization is an interesting
 // thing here, since the serializer is a recusive function, we
 // can't use return, obviously. However we may have multiple try/catch
 // along its way going back to writeNode(). So far we don't come up with a
 // "short-cut" to go "directly" back.
 //
 #define  TRY_CATCH_THROW(action, forceToRethrow)                     \
 fFormatter->setUnRepFlags(XMLFormatter::UnRep_Fail);                 \
 try                                                                  \
 {                                                                    \
      action;                                                         \
 }                                                                 \
 catch(TranscodingException const &e)                                 \
 {                                                                    \
     if ( !reportError(nodeToWrite                                    \
                     , DOMError::DOM_SEVERITY_FATAL_ERROR             \
                     , e.getMessage())                       ||       \
          forceToRethrow                                      )       \
         throw;                                                       \
 }

 DOMWriterImpl::~DOMWriterImpl()
 {
 	delete [] fEncoding;
 	delete [] fNewLine;

 	// we don't own/adopt error handler and filter
 }

 DOMWriterImpl::DOMWriterImpl()
 :fFeatures(0)
 ,fEncoding(0)
 ,fNewLine(0)
 ,fErrorHandler(0)
 ,fFilter(0)
 ,fEncodingUsed(0)
 ,fNewLineUsed(0)
 ,fFormatter(0)
 ,fErrorCount(0)
 {
     //
     // set features to default setting
     //
     setFeature(CANONICAL_FORM_ID,                false);
 	setFeature(DISCARD_DEFAULT_CONTENT_ID,       true );
 	setFeature(ENTITIES_ID,                      true );
 	setFeature(FORMAT_PRETTY_PRINT_ID,	         false);
 	setFeature(NORMALIZE_CHARACTERS_ID,          false);
 	setFeature(SPLIT_CDATA_SECTIONS_ID,          true );
 	setFeature(VALIDATION_ID,                    false);
 	setFeature(WHITESPACE_IN_ELEMENT_CONTENT_ID, true );
 }

 bool DOMWriterImpl::canSetFeature(const XMLCh* const featName
           						, bool               state) const
 {
     int featureId = INVALID_FEATURE_ID;
     return checkFeature(featName, false, featureId) ? canSetFeature(featureId, state) : false;
 }

 void DOMWriterImpl::setFeature(const XMLCh* const featName
                              , bool               state)
 {
     int featureId = INVALID_FEATURE_ID;
     checkFeature(featName, true, featureId);

 	if (!canSetFeature(featureId, state))
     {
         XMLCh  tmpbuf[256];
         XMLString::copyString(tmpbuf, gFeature);
         XMLString::catString(tmpbuf, featName);
         XMLString::catString(tmpbuf, gCantSet);
         XMLString::catString(tmpbuf, state? gTrue : gFalse);
 		throw DOMException(DOMException::NOT_SUPPORTED_ERR, tmpbuf);
     }
     else
         setFeature(featureId, state);

 	//
 	// canonical-form and format-pretty-print can not be both set to true
 	// meaning set canonical-form true will automatically set
 	// format-pretty-print to false and vise versa.
     //
     if ((featureId == CANONICAL_FORM_ID) && state)
         setFeature(FORMAT_PRETTY_PRINT_ID, false);

     if ((featureId == FORMAT_PRETTY_PRINT_ID) && state)
         setFeature(CANONICAL_FORM_ID, false);

     return;
 }

 bool DOMWriterImpl::getFeature(const XMLCh* const featName) const
 {
     int featureId = INVALID_FEATURE_ID;
     checkFeature(featName, true, featureId);
     return getFeature(featureId);
 }

 // we don't check the validity of the encoding set
 void DOMWriterImpl::setEncoding(const XMLCh* const encoding)
 {
 	delete [] fEncoding;
 	fEncoding = XMLString::replicate(encoding);
 }

 const XMLCh* DOMWriterImpl::getEncoding() const
 {
 	return fEncoding;
 }

 void DOMWriterImpl::setNewLine(const XMLCh* const newLine)
 {
 	delete [] fNewLine;
 	fNewLine = XMLString::replicate(newLine);
 }

 const XMLCh* DOMWriterImpl::getNewLine() const
 {
 	return fNewLine;
 }

 void DOMWriterImpl::setErrorHandler(DOMErrorHandler *errorHandler)
 {
 	fErrorHandler = errorHandler;
 }

 DOMErrorHandler* DOMWriterImpl::getErrorHandler() const
 {
 	return fErrorHandler;
 }

 void DOMWriterImpl::setFilter(DOMWriterFilter *filter)
 {
 	fFilter = filter;
 }

 DOMWriterFilter* DOMWriterImpl::getFilter() const
 {
 	return fFilter;
 }

 //
 //
 //
 bool DOMWriterImpl::writeNode(XMLFormatTarget* const destination
                             , const DOMNode         &nodeToWrite)
 {
 	//init session vars
 	initSession(&nodeToWrite);

     try
     {
         fFormatter = new XMLFormatter(fEncodingUsed
                                      ,destination
                                      ,XMLFormatter::NoEscapes
                                      ,XMLFormatter::UnRep_CharRef);
     }
     catch (const TranscodingException& e)
     {
         reportError(&nodeToWrite, DOMError::DOM_SEVERITY_FATAL_ERROR, e.getMessage());
         return false;
     }

     try
     {
         Janitor<XMLFormatter> janName(fFormatter);
         processNode(&nodeToWrite);
 	}

 	//
 	// The serialize engine (processNode) throws an exception to abort
 	// serialization if
 	//
 	//   . A fatal error occurs which renters the output ill-formed, or
 	//   . Instructed by the application's error handler
 	//
 	catch (const TranscodingException&)
 	{
 		return false;
 	}

 	catch (const DOMException&)
 	{
 		return false;
 	}

 	//
 	// DOMSystemException
     // This exception will be raised in response to any sort of IO or system
     // error that occurs while writing to the destination. It may wrap an
     // underlying system exception.
 	//
 	//catch (RuntimeException const &)
 	catch (...)
 	{
 		// REVISIT generate a DOMSystemException wrapping the underlying
 		//         exception.
 		throw;
 	}

 	//
 	// true if node was successfully serialized and
 	// false in case a failure occured and the
 	// failure wasn't canceled by the error handler.
 	//
 	return ((fErrorCount == 0)? true : false);
 }

 //
 // We don't throw DOMSTRING_SIZE_ERR since we are no longer
 // using DOMString.
 //
 XMLCh* DOMWriterImpl::writeToString(const DOMNode &nodeToWrite)
 {
 	MemBufFormatTarget  destination;
 	bool retVal;

    // XMLCh is unicode, assume fEncoding as UTF-16
    XMLCh* tempEncoding = fEncoding;
    fEncoding = (XMLCh*) XMLUni::fgUTF16EncodingString;

 	try
 	{
 		retVal = writeNode(&destination, nodeToWrite);
 	}
 	catch (...)
 	{
 		//
 		// there is a possibility that memeory allocation
 		// exception thrown in XMLBuffer class
 		//
       fEncoding = tempEncoding;
 		return 0;
 	}

     fEncoding = tempEncoding;
     return (retVal ? XMLString::replicate((XMLCh*) destination.getRawBuffer()) : 0);
 }

 void DOMWriterImpl::initSession(const DOMNode* const nodeToWrite)
 {

 /**
  * The encoding to use when writing is determined as follows:
  *     If the encoding attribute has been set, that value will be used.
  *     If the encoding attribute is null or empty,
  *            but the item to be written, or
  *            the owner document specified encoding (ie. the "actualEncoding"
  *            from the document) that value will be used.
  *     If neither of the above provides an encoding name, a default encoding of
  *            "UTF-8" will be used.
  */
 	fEncodingUsed = gUTF8;

 	if (fEncoding && XMLString::stringLen(fEncoding))
 	{
 		fEncodingUsed = fEncoding;
 	}
 	else
 	{
         DOMDocument *docu = (nodeToWrite->getNodeType() == DOMNode::DOCUMENT_NODE)?
                             (DOMDocument*)nodeToWrite : nodeToWrite->getOwnerDocument();
         if (docu)
         {
             const XMLCh* tmpEncoding = docu->getEncoding();

             if ( tmpEncoding && XMLString::stringLen(tmpEncoding))
             {
                 fEncodingUsed = tmpEncoding;
             }
             else
             {
                 tmpEncoding = docu->getActualEncoding();

                 if ( tmpEncoding && XMLString::stringLen(tmpEncoding))
                 {
                     fEncodingUsed = tmpEncoding;
                 }
             }
         }
     }

 /**
  *  The end-of-line sequence of characters to be used in the XML being
  *  written out. The only permitted values are these:
  *     . null
  *
  *  Use a default end-of-line sequence. DOM implementations should choose
  * the default to match the usual convention for text files in the
  * environment being used. Implementations must choose a default
  * sequence that matches one of those allowed by  2.11 "End-of-Line
  * Handling".
  *
  *    CR    The carriage-return character (#xD)
  *    CR-LF The carriage-return and line-feed characters (#xD #xA)
  *    LF    The line-feed character (#xA)
  *
  *  The default value for this attribute is null
  */
 	fNewLineUsed = (fNewLine && XMLString::stringLen(fNewLine))? fNewLine : gEOLSeq;

 	fErrorCount = 0;
 }

 //
 // Characters not representable in output encoding,
 //
 // 1. CHARACTER DATA (outside of markup)                --- no error
 //    ordinary character  -> numeric character reference
 //    '<' and '&'         -> &lt; and &amp;
 //
 // 2. Within MARKUP, but outside of attributes
 //    reported as an error                                 --- ERROR
 //    markup:
 //           start tag                                  done
 //           end tag                                    done
 //           empty element tag                          done
 //           entity references                          done
 //           character references    // REVISIT
 //           comments                                   done
 //           CDATA section delimiters                   done, done
 //           document type declarartions                done
 //           processing instructions (PI)               done
 //
 // 3. With in ATTRIBUTE
 //    -> numeric character reference
 //    no quotes                        -> in quotes
 //    with quotes, no apostrophe       -> in apostrophe
 //    with quotes and apostrophe       -> in quotes and &quot;
 //
 // 4. CDATA sections
 //    "split_cdata_section"  true                      --- char ref
 //                           false                     ---      ERROR
 //

 //
 // REVISIT
 //    FormatPrettyPrint requires proper indentation, newline, and etc.
 //    currently we partially support this feature by adding new line to
 //    xmldecl, doctype and root element, later on we need to work on
 //    other nodes, such as element, attribute and so on.
 //

 // ---------------------------------------------------------------------------
 //  Stream out a DOM node, and, recursively, all of its children. This
 //  function is the heart of writing a DOM tree out as XML source. Give it
 //  a document node and it will do the whole thing.
 // ---------------------------------------------------------------------------
 void DOMWriterImpl::processNode(const DOMNode* const nodeToWrite)
 {
     // Get the name and value out for convenience
     const XMLCh*    nodeName = nodeToWrite->getNodeName();
     const XMLCh*    nodeValue = nodeToWrite->getNodeValue();
     unsigned long   lent = XMLString::stringLen(nodeValue);

     switch (nodeToWrite->getNodeType())
     {
 	case DOMNode::TEXT_NODE:
         {
 			if (checkFilter(nodeToWrite) != DOMNodeFilter::FILTER_ACCEPT)
 				break;

 			setURCharRef();      // character data
             fFormatter->formatBuf(nodeValue, lent, XMLFormatter::CharEscapes);
             break;
         }

 	case DOMNode::PROCESSING_INSTRUCTION_NODE:
         {
 			if (checkFilter(nodeToWrite) != DOMNodeFilter::FILTER_ACCEPT)
 				break;

 			TRY_CATCH_THROW
 			(
 				*fFormatter << XMLFormatter::NoEscapes << gStartPI << nodeName;
 				if (lent > 0)
 				{
 					*fFormatter << chSpace << nodeValue;
 				}
 				*fFormatter << gEndPI;
 				,true
 			)
             break;
         }

 	case DOMNode::DOCUMENT_NODE: // Not to be shown to Filter
         {
 			setURCharRef();
             DOMDocument *docu = (DOMDocument*)nodeToWrite;

             //[23] XMLDecl      ::= '<?xml' VersionInfo EncodingDecl? SDDecl? S? '?>'
             //[24] VersionInfo  ::= S 'version' Eq ("'" VersionNum "'" | '"' VersionNum '"')
             //[80] EncodingDecl ::= S 'encoding' Eq ('"' EncName '"' | "'" EncName
             //[32] SDDecl       ::= S 'standalone' Eq (("'" ('yes' | 'no') "'") | ('"' ('yes' | 'no') '"'))
             //
             // We always print out the xmldecl no matter whether it is
             // present in the original XML instance document or not.
             //
             const XMLCh* versionNo = (docu->getVersion()) ? docu->getVersion() : gXMLDecl_ver10;
 			*fFormatter << gXMLDecl_VersionInfo << versionNo << gXMLDecl_separator;

             // use the encoding resolved in initSession()
             *fFormatter << gXMLDecl_EncodingDecl << fEncodingUsed << gXMLDecl_separator;

             const XMLCh* st = (docu->getStandalone())? XMLUni::fgYesString : XMLUni::fgNoString;
             *fFormatter << gXMLDecl_SDDecl << st << gXMLDecl_separator;

             *fFormatter << gXMLDecl_endtag;
             printNewLine();

             DOMNode *child = nodeToWrite->getFirstChild();
             while( child != 0)
             {
                 processNode(child);
                 printNewLine();
                 child = child->getNextSibling();
             }
             break;
         }

 	case DOMNode::ELEMENT_NODE:
         {
 			DOMNodeFilter::FilterAction filterAction = checkFilter(nodeToWrite);

 			if ( filterAction == DOMNodeFilter::FILTER_REJECT)
 				break;

 			if ( filterAction == DOMNodeFilter::FILTER_ACCEPT)
 			{
 				//           this element    attributes   child elements
                 // accept        yes             yes           yes
 				// skip          no              no            yes
 				//
 				TRY_CATCH_THROW
 				(
 				// The name has to be representable without any escapes
                     *fFormatter  << XMLFormatter::NoEscapes
                                  << chOpenAngle << nodeName;
 			        ,true
 			    )

 				// Output any attributes on this element
 				setURCharRef();
 				DOMNamedNodeMap *attributes = nodeToWrite->getAttributes();
 				int attrCount = attributes->getLength();

 				bool discard = getFeature(DISCARD_DEFAULT_CONTENT_ID);
 				for (int i = 0; i < attrCount; i++)
 				{
 					DOMNode  *attribute = attributes->item(i);

 					// Not to be shown to Filter

 					//
 					//"discard-default-content"
 					//	true
 					//	[required] (default)
 					//	Use whatever information available to the implementation
 					//  (i.e. XML schema, DTD, the specified flag on Attr nodes,
 					//  and so on) to decide what attributes and content should be
 					//  discarded or not.
 					//  Note that the specified flag on Attr nodes in itself is
 					//  not always reliable, it is only reliable when it is set
 					//  to false since the only case where it can be set to false
 					//  is if the attribute was created by the implementation.
 					//  The default content won't be removed if an implementation
 					//  does not have any information available.
 					//	false
 					//	[required]
 					//	Keep all attributes and all content.
 					//
 					if (discard && !((DOMAttr*)attribute )->getSpecified())
 						continue;
 					//
 					//  Again the name has to be completely representable. But the
 					//  attribute can have refs and requires the attribute style
 					//  escaping.
 					//

 					*fFormatter  << XMLFormatter::NoEscapes
                                  << chSpace << attribute->getNodeName()
                                  << chEqual << chDoubleQuote
                                  << XMLFormatter::AttrEscapes
                                  << attribute->getNodeValue()
                                  << XMLFormatter::NoEscapes
                                  << chDoubleQuote;
 				} // end of for
 			} // end of FILTER_ACCEPT

 			// FILTER_SKIP may start from here

             //
             //  Test for the presence of children, which includes both
             //  text content and nested elements.
             //
             DOMNode *child = nodeToWrite->getFirstChild();
             if (child != 0)
             {
                 // There are children. Close start-tag, and output children.
                 // No escapes are legal here
 				if (filterAction == DOMNodeFilter::FILTER_ACCEPT)
 					*fFormatter << XMLFormatter::NoEscapes << chCloseAngle;

                 while( child != 0)
                 {
                     processNode(child);
                     child = child->getNextSibling();
                 }

 				if (filterAction == DOMNodeFilter::FILTER_ACCEPT)
 				{
 					TRY_CATCH_THROW
 					(
                          *fFormatter << XMLFormatter::NoEscapes << gEndElement
                                      << nodeName << chCloseAngle;
                         ,true
 	                )
 				}
             }
             else
             {
                 //
                 //  There were no children. Output the short form close of
                 //  the element start tag, making it an empty-element tag.
                 //
 				if (filterAction == DOMNodeFilter::FILTER_ACCEPT)
 				{
 					TRY_CATCH_THROW
                     (
 					    *fFormatter << XMLFormatter::NoEscapes << chForwardSlash << chCloseAngle;
 				       , true
 				    )
 				}
             }
             break;
         }

 	case DOMNode::ENTITY_REFERENCE_NODE:
 		{
 			//"entities"
 			//true
 			//[required] (default)
 			//Keep EntityReference and Entity nodes in the document.

 			//false
 			//[optional]
 			//Remove all EntityReference and Entity nodes from the document,
 			//       putting the entity expansions directly in their place.
 			//       Text nodes are into "normal" form.
 			//Only EntityReference nodes to non-defined entities are kept in the document.

 			if (checkFilter(nodeToWrite) != DOMNodeFilter::FILTER_ACCEPT)
 				break;

 			if (getFeature(ENTITIES_ID))
 			{
 				TRY_CATCH_THROW
 				(
 					*fFormatter << XMLFormatter::NoEscapes << chAmpersand
                                 << nodeName << chSemiColon;
 				    , true
 				)
 			}
 			else
 			{
                 // check if the referenced entity is defined or not
                 if (nodeToWrite->getOwnerDocument()->getDoctype()->getEntities()->getNamedItem(nodeName))
                 {
                     DOMNode *child;
                     for (child = nodeToWrite->getFirstChild();
                     child != 0;
                     child = child->getNextSibling())
                     {
                         processNode(child);
                     }
                 }
                 else
                 {
                     TRY_CATCH_THROW
                    (
                         *fFormatter<<XMLFormatter::NoEscapes<<chAmpersand<<nodeName<<chSemiColon;
                         , true
 				    )
                 }
 			}
 			break;
 		}

         //
         //  feature:split_cdata_sections     occurence of ]]>   unrep-char
         //  ===============================================================
         //          true                        split            split
         //          false                       fails            fails
         //
 	case DOMNode::CDATA_SECTION_NODE:
 		{
 			if (checkFilter(nodeToWrite) != DOMNodeFilter::FILTER_ACCEPT)
 				break;

 			if (getFeature(SPLIT_CDATA_SECTIONS_ID))
 			{
                 // it is fairly complicated and we process this
                 // in a separate function.
                 procCdataSection(nodeValue, nodeToWrite);
 			}
 			else
 			{
                 // search for "]]>"
                 if (XMLString::patternMatch((XMLCh* const) nodeValue, gEndCDATA) != -1)
                 {
                     reportError(nodeToWrite, DOMError::DOM_SEVERITY_FATAL_ERROR, gNestedCdata);
                     throw DOMException(DOMException::SYNTAX_ERR, gNestedCdata);
                 }

                 TRY_CATCH_THROW
                 (
                     // transcoder throws exception for unrep chars
                     *fFormatter << XMLFormatter::NoEscapes << gStartCDATA << nodeValue << gEndCDATA;
                    , true
 			    )
             }

             break;
 		}

 	case DOMNode::COMMENT_NODE:
         {
 			if (checkFilter(nodeToWrite) != DOMNodeFilter::FILTER_ACCEPT)
 				break;

 			TRY_CATCH_THROW
 			(
                 *fFormatter << XMLFormatter::NoEscapes << gStartComment
                 << nodeValue << gEndComment;
 			    , true
 			)
 			break;
         }

 	case DOMNode::DOCUMENT_TYPE_NODE:  // Not to be shown to Filter
 		{
             DOMDocumentType *doctype = (DOMDocumentType *)nodeToWrite;;

 			fFormatter->setEscapeFlags(XMLFormatter::NoEscapes);
             TRY_CATCH_THROW
 			(
     			*fFormatter << gStartDoctype << nodeName;

     			const XMLCh  *id = doctype->getPublicId();
                 if (id && *id)
 				{
                     *fFormatter << chSpace << gPublic << id << chDoubleQuote;

 					id = doctype->getSystemId();
 					if (id && *id)
 					{
 						*fFormatter << chSpace << chDoubleQuote << id << chDoubleQuote;
 					}
 					else
 					{
 						//
                         // 4.2.2 External Entities
                         // [Definition: If the entity is not internal,
 						//           it is an external entity, declared as follows:]
 						// External Entity Declaration
 						// [75] ExternalID ::= 'SYSTEM' S SystemLiteral
 						//                   | 'PUBLIC' S PubidLiteral S SystemLiteral
 						//
                         reportError(nodeToWrite, DOMError::DOM_SEVERITY_FATAL_ERROR, gUnrecognizedNodeType);
                         throw DOMException(DOMException::NOT_FOUND_ERR, 0);
 						// systemLiteral not found
 					}
 				}
 				else
 				{
 					id = doctype->getSystemId();
 					if (id && *id)
 					{
 						*fFormatter << chSpace << gSystem << id << chDoubleQuote;
 					}
 				}

 				id = doctype->getInternalSubset();
 				if (id && *id)
 				{
 					*fFormatter << chSpace << chOpenSquare << id << chCloseSquare;
 				}

 				*fFormatter << chCloseAngle;
 				, true

 			) // end of TRY_CATCH_THROW

 			break;
         }

 	case DOMNode::ENTITY_NODE:  // Not to be shown to Filter
         {
 			//
 			// REVISIT: how does the feature "entities" impact
 			// entity node?
 			//

 			fFormatter->setEscapeFlags(XMLFormatter::NoEscapes);
 			*fFormatter << gStartEntity	<< nodeName;

 			const XMLCh * id = ((DOMEntity*)nodeToWrite)->getPublicId();
 			if (id)
 				*fFormatter << gPublic << id << chDoubleQuote;

 			id = ((DOMEntity*)nodeToWrite)->getSystemId();
 			if (id)
 				*fFormatter << gSystem << id << chDoubleQuote;

 			id = ((DOMEntity*)nodeToWrite)->getNotationName();
 			if (id)
 				*fFormatter << gNotation << id << chDoubleQuote;

             *fFormatter << chCloseAngle;

             printNewLine();

 			break;
         }

 	default:
     	/***
 		    This is an implementation specific behaviour, we abort serialization
 			once unrecognized node type encountered.
 	     ***/
         {
             reportError(nodeToWrite, DOMError::DOM_SEVERITY_FATAL_ERROR, gUnrecognizedNodeType);
             throw DOMException(DOMException::NOT_FOUND_ERR, 0);
 			// UnreognizedNodeType;
 		}

 		break;
     }

 }

 //
 //
 DOMNodeFilter::FilterAction DOMWriterImpl::checkFilter(const DOMNode* const node) const
 {
 	if (!fFilter ||
         ((fFilter->getWhatToShow() & (1 << (node->getNodeType() - 1))) == 0))
 		return DOMNodeFilter::FILTER_ACCEPT;

 	//
 	// if and only if there is a filter, and it is interested
 	// in the node type, then we pass the node to the filter
 	// for examination
 	//
 	return (DOMNodeFilter::FilterAction) fFilter->acceptNode(node);
 }


 bool DOMWriterImpl::checkFeature(const XMLCh* const featName
                                , bool               toThrow
                                , int&               featureId) const
 {
     // check for null and/or empty feature name
     if ((!featName) || (XMLString::stringLen(featName)==0))
     {
         if (toThrow)
             throw DOMException(DOMException::NOT_FOUND_ERR, 0);

         return false;
     }

     featureId = INVALID_FEATURE_ID;

     if (XMLString::compareString(featName, XMLUni::fgDOMWRTCanonicalForm)==0)
         featureId = CANONICAL_FORM_ID;
     else if (XMLString::compareString(featName, XMLUni::fgDOMWRTDiscardDefaultContent)==0)
         featureId = DISCARD_DEFAULT_CONTENT_ID;
     else if (XMLString::compareString(featName, XMLUni::fgDOMWRTEntities)==0)
         featureId = ENTITIES_ID;
     else if (XMLString::compareString(featName, XMLUni::fgDOMWRTFormatPrettyPrint)==0)
         featureId = FORMAT_PRETTY_PRINT_ID;
     else if (XMLString::compareString(featName, XMLUni::fgDOMWRTNormalizeCharacters)==0)
         featureId = NORMALIZE_CHARACTERS_ID;
     else if (XMLString::compareString(featName, XMLUni::fgDOMWRTSplitCdataSections)==0)
         featureId = SPLIT_CDATA_SECTIONS_ID;
     else if (XMLString::compareString(featName, XMLUni::fgDOMWRTValidation)==0)
         featureId = VALIDATION_ID;
     else if (XMLString::compareString(featName, XMLUni::fgDOMWRTWhitespaceInElementContent)==0)
         featureId = WHITESPACE_IN_ELEMENT_CONTENT_ID;

     //feature name not resolvable
     if (featureId == INVALID_FEATURE_ID)
     {
         if (toThrow)
             throw DOMException(DOMException::NOT_FOUND_ERR, featName);

         return false;
     }

     return true;
 }

 bool DOMWriterImpl::reportError(const DOMNode* const    errorNode
                               , DOMError::ErrorSeverity errorType
                               , const XMLCh*   const    errorMsg)
 {
     bool toContinueProcess = true;   // default value for no error handler

     if (fErrorHandler)
     {
         DOMLocatorImpl  locator(0, 0, (DOMNode* const) errorNode, 0, 0);
         DOMErrorImpl    domError(errorType , errorMsg, &locator);
         toContinueProcess = fErrorHandler->handleError(domError);
     }

     fErrorCount++;
     return toContinueProcess;
 }

 //
 //
 //
 void DOMWriterImpl::procCdataSection(const XMLCh*   const nodeValue
                                    , const DOMNode* const nodeToWrite)
 {
     XMLCh* curPtr  = (XMLCh*) nodeValue;
     XMLCh* nextPtr = 0;
     int    endTagPos = -1;
     int    offset = XMLString::stringLen(gEndCDATA);
     bool   endTagFound = true;

     while (endTagFound)
     {
         endTagPos = XMLString::patternMatch(curPtr, gEndCDATA);
         if (endTagPos != -1)
         {
             nextPtr = curPtr + endTagPos + offset;  // skip the ']]>'
             *(curPtr + endTagPos) = chNull;         //nullify the first ']'

             reportError(nodeToWrite, DOMError::DOM_SEVERITY_WARNING, gNestedCdata);
         }
         else
         {
             endTagFound = false;
         }

         procUnrepCharInCdataSection(curPtr, nodeToWrite);

         if (endTagFound)
         {
             *(nextPtr - offset) = chCloseSquare;   //restore the first ']'
             curPtr = nextPtr;
         }
     }

     return;
 }

 //
 //
 //
 void DOMWriterImpl::procUnrepCharInCdataSection(const XMLCh*   const nodeValue
                                               , const DOMNode* const nodeToWrite)
 {
     //
     //  We have to check each character and see if it could be represented.
     //  As long as it can, we just keep up with where we started and how
     //  many chars we've checked. When we hit an unrepresentable one, we
     //  stop, transcode everything we've collected, then start handling
     //  the unrepresentables via char refs. We repeat this until we get all
     //  the chars done.
     //
     const XMLCh*    srcPtr = nodeValue;
     const XMLCh*    endPtr = nodeValue +  XMLString::stringLen(nodeValue);;

     // Set up the common part of the buffer that we build char refs into
     XMLCh tmpBuf[32];
     tmpBuf[0] = chAmpersand;
     tmpBuf[1] = chPound;
     tmpBuf[2] = chLatin_x;

     while (srcPtr < endPtr)
     {
         const XMLCh* tmpPtr = srcPtr;
         while (tmpPtr < endPtr)
         {
             if (fFormatter->getTranscoder()->canTranscodeTo(*tmpPtr))
                 tmpPtr++;
             else
                 break;
         }

         if (tmpPtr > srcPtr)
         {

             TRY_CATCH_THROW
            (
                 *fFormatter << XMLFormatter::NoEscapes << gStartCDATA;
                 , true
             )

             // We got at least some chars that can be done normally
             fFormatter->formatBuf
             (
                 srcPtr
                 , tmpPtr - srcPtr
                 , XMLFormatter::CharEscapes
                 , XMLFormatter::UnRep_Fail
             );

             TRY_CATCH_THROW
             (
                 *fFormatter << XMLFormatter::NoEscapes << gEndCDATA;
                 , true
             )

             // Update the source pointer to our new spot
             srcPtr = tmpPtr;
         }
          else
         {
              //
              //  We hit something unrepresentable. So continue forward doing
              //  char refs until we hit something representable again or the
              //  end of input.
              //

              // one warning for consective unrep chars
              reportError(nodeToWrite, DOMError::DOM_SEVERITY_WARNING, gUnrepresentableChar);

             while (srcPtr < endPtr)
             {
                 // Build a char ref for the current char
                 XMLString::binToText(*srcPtr, &tmpBuf[3], 8, 16);
                 const unsigned int bufLen = XMLString::stringLen(tmpBuf);
                 tmpBuf[bufLen] = chSemiColon;
                 tmpBuf[bufLen+1] = chNull;

                 // And now call recursively back to our caller to format this
                 fFormatter->formatBuf
                 (
                     tmpBuf
                     , bufLen + 1
                     , XMLFormatter::NoEscapes
                     , XMLFormatter::UnRep_Fail
                 );

                 // Move up the source pointer and break out if needed
                 srcPtr++;
                 if (fFormatter->getTranscoder()->canTranscodeTo(*srcPtr))
                     break;
             }
         }
     }
 }

 bool DOMWriterImpl::canSetFeature(const int featureId
                                        , bool      val) const
 {
     return featuresSupported[2*featureId + (val? 0: 1)];
 }

 void DOMWriterImpl::printNewLine() const
 {
     if (getFeature(FORMAT_PRETTY_PRINT_ID))
         *fFormatter << fNewLineUsed;
 }

 void DOMWriterImpl::release()
 {
     DOMWriterImpl* writer = (DOMWriterImpl*) this;
     delete writer;
 }