blob: 2a21691332642fa04033c3e409e7c3eabcb1e540 [file] [log] [blame]
/*
* The Apache Software License, Version 1.1
*
* Copyright (c) 1999-2000 The Apache Software Foundation. All rights
* reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
*
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
*
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in
* the documentation and/or other materials provided with the
* distribution.
*
* 3. The end-user documentation included with the redistribution,
* if any, must include the following acknowledgment:
* "This product includes software developed by the
* Apache Software Foundation (http://www.apache.org/)."
* Alternately, this acknowledgment may appear in the software itself,
* if and wherever such third-party acknowledgments normally appear.
*
* 4. The names "Xerces" and "Apache Software Foundation" must
* not be used to endorse or promote products derived from this
* software without prior written permission. For written
* permission, please contact apache\@apache.org.
*
* 5. Products derived from this software may not be called "Apache",
* nor may "Apache" appear in their name, without prior written
* permission of the Apache Software Foundation.
*
* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
* DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
* ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
* USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
* ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
* OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
* ====================================================================
*
* This software consists of voluntary contributions made by many
* individuals on behalf of the Apache Software Foundation, and was
* originally based on software copyright (c) 1999, International
* Business Machines, Inc., http://www.ibm.com . For more information
* on the Apache Software Foundation, please see
* <http://www.apache.org/>.
*/
// ---------------------------------------------------------------------------
// Includes
// ---------------------------------------------------------------------------
#include <xercesc/util/BitOps.hpp>
#include <xercesc/util/XMLUTF16Transcoder.hpp>
#include <xercesc/util/TranscodingException.hpp>
#include <string.h>
// ---------------------------------------------------------------------------
// XMLUTF16Transcoder: Constructors and Destructor
// ---------------------------------------------------------------------------
//
//  Builds a UTF-16 transcoder. The encoding name and block size are passed
//  straight through to the XMLTranscoder base class; the swapped flag is
//  remembered in fSwapped, which transcodeFrom() and transcodeTo() test to
//  decide whether each 16 bit unit must be byte swapped.
//
XMLUTF16Transcoder::XMLUTF16Transcoder(const XMLCh* const encodingName,
                                       const unsigned int blockSize,
                                       const bool         swapped)
    : XMLTranscoder(encodingName, blockSize)
    , fSwapped(swapped)
{
}
//  Nothing to release here: the body is intentionally empty.
XMLUTF16Transcoder::~XMLUTF16Transcoder()
{
}
// ---------------------------------------------------------------------------
// XMLUTF16Transcoder: Implementation of the transcoder API
// ---------------------------------------------------------------------------
unsigned int
XMLUTF16Transcoder::transcodeFrom( const XMLByte* const srcData
, const unsigned int srcCount
, XMLCh* const toFill
, const unsigned int maxChars
, unsigned int& bytesEaten
, unsigned char* const charSizes)
{
// If debugging, make sure that the block size is legal
#if defined(XERCES_DEBUG)
checkBlockSize(maxChars);
#endif
//
// Calculate the max chars we can do here. Its the lesser of the
// max output chars and the number of chars in the source.
//
const unsigned int srcChars = srcCount / sizeof(UTF16Ch);
const unsigned int countToDo = srcChars < maxChars ? srcChars : maxChars;
// Look at the source data as UTF16 chars
const UTF16Ch* asUTF16 = (const UTF16Ch*)srcData;
// And get a mutable pointer to the output
XMLCh* outPtr = toFill;
//
// If its swapped, we have to do a char by char swap and cast. Else
// we have to check whether our XMLCh and UTF16Ch types are the same
// size or not. If so, we can optimize by just doing a buffer copy.
//
if (fSwapped)
{
//
// And then do the swapping loop for the count we precalculated. Note
// that this also handles size conversion as well if XMLCh is not the
// same size as UTF16Ch.
//
for (unsigned int index = 0; index < countToDo; index++)
*outPtr++ = BitOps::swapBytes(*asUTF16++);
}
else
{
//
// If the XMLCh type is the same size as a UTF16 value on this
// platform, then we can do just a buffer copy straight to the target
// buffer since our source chars are UTF-16 chars. If its not, then
// we still have to do a loop and assign each one, in order to
// implicitly convert.
//
if (sizeof(XMLCh) == sizeof(UTF16Ch))
{
// Notice we convert char count to byte count here!!!
memcpy(toFill, srcData, countToDo * sizeof(UTF16Ch));
}
else
{
for (unsigned int index = 0; index < countToDo; index++)
*outPtr++ = XMLCh(*asUTF16++);
}
}
// Set the bytes eaten
bytesEaten = countToDo * sizeof(UTF16Ch);
// Set the character sizes to the fixed size
memset(charSizes, sizeof(UTF16Ch), countToDo);
// Return the chars we transcoded
return countToDo;
}
unsigned int
XMLUTF16Transcoder::transcodeTo(const XMLCh* const srcData
, const unsigned int srcCount
, XMLByte* const toFill
, const unsigned int maxBytes
, unsigned int& charsEaten
, const UnRepOpts options)
{
// If debugging, make sure that the block size is legal
#if defined(XERCES_DEBUG)
checkBlockSize(maxBytes);
#endif
//
// Calculate the max chars we can do here. Its the lesser of the
// chars that we can fit into the output buffer, and the source
// chars available.
//
const unsigned int maxOutChars = maxBytes / sizeof(UTF16Ch);
const unsigned int countToDo = srcCount < maxOutChars ? srcCount : maxOutChars;
//
// Get a pointer tot he output buffer in the UTF-16 character format
// that we need to work with. And get a mutable pointer to the source
// character buffer.
//
UTF16Ch* outPtr = (UTF16Ch*)toFill;
const XMLCh* srcPtr = srcData;
//
// If the target format is swapped from our native format, then handle
// it one way, else handle it another.
//
if (fSwapped)
{
//
// And then do the swapping loop for the count we precalculated. Note
// that this also handles size conversion as well if XMLCh is not the
// same size as UTF16Ch.
//
for (unsigned int index = 0; index < countToDo; index++)
{
// To avoid flakey compilers, use a temp
const UTF16Ch tmpCh = UTF16Ch(*srcPtr++);
*outPtr++ = BitOps::swapBytes(tmpCh);
}
}
else
{
//
// If XMLCh and UTF16Ch are the same size, we can just do a fast
// memory copy. Otherwise, we have to do a loop and downcast each
// character into its new 16 bit storage.
//
if (sizeof(XMLCh) == sizeof(UTF16Ch))
{
// Notice we convert char count to byte count here!!!
memcpy(toFill, srcData, countToDo * sizeof(UTF16Ch));
}
else
{
for (unsigned int index = 0; index < countToDo; index++)
*outPtr++ = UTF16Ch(*srcPtr++);
}
}
// Set the chars eaten to the calculated number we ate
charsEaten = countToDo;
//Return the bytes we ate. Note we convert to a byte count here!
return countToDo * sizeof(UTF16Ch);
}
//
//  Reports whether the given character can be transcoded to this encoding.
//  The argument is never inspected; the answer is always true.
//
bool XMLUTF16Transcoder::canTranscodeTo(const unsigned int toCheck) const
{
    return true;
}