AOO410/main/sal/rtl/source/ustring.c - openoffice - Git at Google

 /**************************************************************
  *
  * Licensed to the Apache Software Foundation (ASF) under one
  * or more contributor license agreements.  See the NOTICE file
  * distributed with this work for additional information
  * regarding copyright ownership.  The ASF licenses this file
  * to you under the Apache License, Version 2.0 (the
  * "License"); you may not use this file except in compliance
  * with the License.  You may obtain a copy of the License at
  *
  *   http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing,
  * software distributed under the License is distributed on an
  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
  * KIND, either express or implied.  See the License for the
  * specific language governing permissions and limitations
  * under the License.
  *
  *************************************************************/


 #if defined(_MSC_VER) && (_MSC_VER >= 1400)
 #pragma warning(disable:4738) // storing 32-bit float result in memory, possible loss of performance
 #endif

 #include <rtl/memory.h>
 #include <osl/diagnose.h>
 #include <osl/interlck.h>
 #include <rtl/alloc.h>
 #include <osl/mutex.h>
 #include <osl/doublecheckedlocking.h>
 #include <rtl/tencinfo.h>

 #include <string.h>
 #include <sal/alloca.h>

 #include "hash.h"
 #include "strimp.h"
 #include "surrogates.h"
 #include <rtl/ustring.h>

 #include "rtl/math.h"
 #include "rtl/tencinfo.h"

 /* ======================================================================= */

 /* static data to be referenced by all empty strings
  * the refCount is predefined to 1 and must never become 0 !
  */
 static rtl_uString const aImplEmpty_rtl_uString =
 {
     (sal_Int32) (SAL_STRING_INTERN_FLAG|SAL_STRING_STATIC_FLAG|1), /*sal_Int32    refCount; */
     0,                                               /*sal_Int32    length;   */
     { 0 }                                            /*sal_Unicode  buffer[1];*/
 };

 /* ======================================================================= */

 #define IMPL_RTL_STRCODE            sal_Unicode
 #define IMPL_RTL_USTRCODE( c )      (c)
 #define IMPL_RTL_STRNAME( n )       rtl_ustr_ ## n

 #define IMPL_RTL_STRINGNAME( n )    rtl_uString_ ## n
 #define IMPL_RTL_STRINGDATA         rtl_uString
 #define IMPL_RTL_EMPTYSTRING        aImplEmpty_rtl_uString
 #define IMPL_RTL_INTERN
 static void internRelease (rtl_uString *pThis);

 /* ======================================================================= */

 /* Include String/UString template code */

 #include "strtmpl.c"

 sal_Int32 rtl_ustr_indexOfAscii_WithLength(
     sal_Unicode const * str, sal_Int32 len,
     char const * subStr, sal_Int32 subLen)
 {
     if (subLen > 0 && subLen <= len) {
         sal_Int32 i;
         for (i = 0; i <= len - subLen; ++i) {
             if (rtl_ustr_asciil_reverseEquals_WithLength(
                     str + i, subStr, subLen))
             {
                 return i;
             }
         }
     }
     return -1;
 }

 sal_Int32 rtl_ustr_lastIndexOfAscii_WithLength(
     sal_Unicode const * str, sal_Int32 len,
     char const * subStr, sal_Int32 subLen)
 {
     if (subLen > 0 && subLen <= len) {
         sal_Int32 i;
         for (i = len - subLen; i >= 0; --i) {
             if (rtl_ustr_asciil_reverseEquals_WithLength(
                     str + i, subStr, subLen))
             {
                 return i;
             }
         }
     }
     return -1;
 }

 sal_Int32 SAL_CALL rtl_ustr_valueOfFloat(sal_Unicode * pStr, float f)
 {
     rtl_uString * pResult = NULL;
     sal_Int32 nLen;
     rtl_math_doubleToUString(
         &pResult, 0, 0, f, rtl_math_StringFormat_G,
         RTL_USTR_MAX_VALUEOFFLOAT - RTL_CONSTASCII_LENGTH("-x.E-xxx"), '.', 0,
         0, sal_True);
     nLen = pResult->length;
     OSL_ASSERT(nLen < RTL_USTR_MAX_VALUEOFFLOAT);
     rtl_copyMemory(pStr, pResult->buffer, (nLen + 1) * sizeof(sal_Unicode));
     rtl_uString_release(pResult);
     return nLen;
 }

 sal_Int32 SAL_CALL rtl_ustr_valueOfDouble(sal_Unicode * pStr, double d)
 {
     rtl_uString * pResult = NULL;
     sal_Int32 nLen;
     rtl_math_doubleToUString(
         &pResult, 0, 0, d, rtl_math_StringFormat_G,
         RTL_USTR_MAX_VALUEOFDOUBLE - RTL_CONSTASCII_LENGTH("-x.E-xxx"), '.', 0,
         0, sal_True);
     nLen = pResult->length;
     OSL_ASSERT(nLen < RTL_USTR_MAX_VALUEOFDOUBLE);
     rtl_copyMemory(pStr, pResult->buffer, (nLen + 1) * sizeof(sal_Unicode));
     rtl_uString_release(pResult);
     return nLen;
 }

 float SAL_CALL rtl_ustr_toFloat(sal_Unicode const * pStr)
 {
     return (float) rtl_math_uStringToDouble(pStr,
                                             pStr + rtl_ustr_getLength(pStr),
                                             '.', 0, 0, 0);
 }

 double SAL_CALL rtl_ustr_toDouble(sal_Unicode const * pStr)
 {
     return rtl_math_uStringToDouble(pStr, pStr + rtl_ustr_getLength(pStr), '.',
                                     0, 0, 0);
 }

 /* ======================================================================= */

 sal_Int32 SAL_CALL rtl_ustr_ascii_compare( const sal_Unicode* pStr1,
                                            const sal_Char* pStr2 )
 {
     sal_Int32 nRet;
     while ( ((nRet = ((sal_Int32)(*pStr1))-
                      ((sal_Int32)((unsigned char)(*pStr2)))) == 0) &&
             *pStr2 )
     {
         pStr1++;
         pStr2++;
     }

     return nRet;
 }

 /* ----------------------------------------------------------------------- */

 sal_Int32 SAL_CALL rtl_ustr_ascii_compare_WithLength( const sal_Unicode* pStr1,
                                                       sal_Int32 nStr1Len,
                                                       const sal_Char* pStr2 )
 {
 	sal_Int32 nRet = 0;
     while( ((nRet = (nStr1Len ? (sal_Int32)(*pStr1) : 0)-
                     ((sal_Int32)((unsigned char)(*pStr2)))) == 0) &&
            nStr1Len && *pStr2 )
     {
         pStr1++;
         pStr2++;
         nStr1Len--;
     }

     return nRet;
 }

 /* ----------------------------------------------------------------------- */

 sal_Int32 SAL_CALL rtl_ustr_ascii_shortenedCompare_WithLength( const sal_Unicode* pStr1,
                                                                sal_Int32 nStr1Len,
                                                                const sal_Char* pStr2,
                                                                sal_Int32 nShortenedLength )
 {
     const sal_Unicode*  pStr1End = pStr1 + nStr1Len;
     sal_Int32           nRet;
     while ( (nShortenedLength > 0) &&
             (pStr1 < pStr1End) && *pStr2 )
     {
         /* Check ASCII range */
         OSL_ENSURE( (*pStr2 & 0x80) == 0, "Found ASCII char > 127");

         nRet = ((sal_Int32)*pStr1)-
                ((sal_Int32)(unsigned char)*pStr2);
         if ( nRet != 0 )
             return nRet;

         nShortenedLength--;
         pStr1++;
         pStr2++;
     }

     if ( nShortenedLength <= 0 )
         return 0;

     if ( *pStr2 )
     {
         OSL_ENSURE( pStr1 == pStr1End, "pStr1 == pStr1End failed" );
         // first is a substring of the second string => less (negative value)
         nRet = -1;
     }
     else
     {
         // greater or equal
         nRet = pStr1End - pStr1;
     }

     return nRet;
 }

 /* ----------------------------------------------------------------------- */

 sal_Int32 SAL_CALL rtl_ustr_asciil_reverseCompare_WithLength( const sal_Unicode* pStr1,
                                                               sal_Int32 nStr1Len,
                                                               const sal_Char* pStr2,
                                                               sal_Int32 nStr2Len )
 {
     const sal_Unicode*  pStr1Run = pStr1+nStr1Len;
     const sal_Char*     pStr2Run = pStr2+nStr2Len;
     sal_Int32           nRet;
     while ( (pStr1 < pStr1Run) && (pStr2 < pStr2Run) )
     {
         pStr1Run--;
         pStr2Run--;
         nRet = ((sal_Int32)*pStr1Run)-((sal_Int32)*pStr2Run);
         if ( nRet )
             return nRet;
     }

     return nStr1Len - nStr2Len;
 }

 /* ----------------------------------------------------------------------- */

 sal_Bool SAL_CALL rtl_ustr_asciil_reverseEquals_WithLength( const sal_Unicode* pStr1,
                                                               const sal_Char* pStr2,
                                                               sal_Int32 nStrLen )
 {
     const sal_Unicode*  pStr1Run = pStr1+nStrLen;
     const sal_Char*     pStr2Run = pStr2+nStrLen;
     while ( pStr1 < pStr1Run )
     {
         pStr1Run--;
         pStr2Run--;
 		if( *pStr1Run != (sal_Unicode)*pStr2Run )
 			return sal_False;
     }

     return sal_True;
 }

 /* ----------------------------------------------------------------------- */

 sal_Int32 SAL_CALL rtl_ustr_ascii_compareIgnoreAsciiCase( const sal_Unicode* pStr1,
                                                           const sal_Char* pStr2 )
 {
     sal_Int32   nRet;
     sal_Int32   c1;
     sal_Int32   c2;
     do
     {
         /* If character between 'A' and 'Z', than convert it to lowercase */
         c1 = (sal_Int32)*pStr1;
         c2 = (sal_Int32)((unsigned char)*pStr2);
         if ( (c1 >= 65) && (c1 <= 90) )
             c1 += 32;
         if ( (c2 >= 65) && (c2 <= 90) )
             c2 += 32;
         nRet = c1-c2;
         if ( nRet != 0 )
             return nRet;

         pStr1++;
         pStr2++;
     }
     while ( c2 );

     return 0;
 }

 /* ----------------------------------------------------------------------- */

 sal_Int32 SAL_CALL rtl_ustr_ascii_compareIgnoreAsciiCase_WithLength( const sal_Unicode* pStr1,
                                                                      sal_Int32 nStr1Len,
                                                                      const sal_Char* pStr2 )
 {
     sal_Int32   nRet;
     sal_Int32   c1;
     sal_Int32   c2;
     do
     {
         if ( !nStr1Len )
             return *pStr2 == '\0' ? 0 : -1;

         /* If character between 'A' and 'Z', than convert it to lowercase */
         c1 = (sal_Int32)*pStr1;
         c2 = (sal_Int32)((unsigned char)*pStr2);
         if ( (c1 >= 65) && (c1 <= 90) )
             c1 += 32;
         if ( (c2 >= 65) && (c2 <= 90) )
             c2 += 32;
         nRet = c1-c2;
         if ( nRet != 0 )
             return nRet;

         pStr1++;
         pStr2++;
         nStr1Len--;
     }
     while( c2 );

     return 0;
 }

 sal_Int32 rtl_ustr_ascii_compareIgnoreAsciiCase_WithLengths(
     sal_Unicode const * first, sal_Int32 firstLen,
     char const * second, sal_Int32 secondLen)
 {
     sal_Int32 i;
     sal_Int32 len = firstLen < secondLen ? firstLen : secondLen;
     for (i = 0; i < len; ++i) {
         sal_Int32 c1 = *first++;
         sal_Int32 c2 = (unsigned char) *second++;
         sal_Int32 d;
         if (c1 >= 65 && c1 <= 90) {
             c1 += 32;
         }
         if (c2 >= 65 && c2 <= 90) {
             c2 += 32;
         }
         d = c1 - c2;
         if (d != 0) {
             return d;
         }
     }
     return firstLen - secondLen;
 }

 /* ----------------------------------------------------------------------- */

 sal_Int32 SAL_CALL rtl_ustr_ascii_shortenedCompareIgnoreAsciiCase_WithLength( const sal_Unicode* pStr1,
                                                                               sal_Int32 nStr1Len,
                                                                               const sal_Char* pStr2,
                                                                               sal_Int32 nShortenedLength )
 {
     const sal_Unicode*  pStr1End = pStr1 + nStr1Len;
     sal_Int32           nRet;
     sal_Int32           c1;
     sal_Int32           c2;
     while ( (nShortenedLength > 0) &&
             (pStr1 < pStr1End) && *pStr2 )
     {
         /* Check ASCII range */
         OSL_ENSURE( (*pStr2 & 0x80) == 0, "Found ASCII char > 127");

         /* If character between 'A' and 'Z', than convert it to lowercase */
         c1 = (sal_Int32)*pStr1;
         c2 = (sal_Int32)((unsigned char)*pStr2);
         if ( (c1 >= 65) && (c1 <= 90) )
             c1 += 32;
         if ( (c2 >= 65) && (c2 <= 90) )
             c2 += 32;
         nRet = c1-c2;
         if ( nRet != 0 )
             return nRet;

         nShortenedLength--;
         pStr1++;
         pStr2++;
     }

     if ( nShortenedLength <= 0 )
         return 0;

     if ( *pStr2 )
     {
         OSL_ENSURE( pStr1 == pStr1End, "pStr1 == pStr1End failed" );
         // first is a substring of the second string => less (negative value)
         nRet = -1;
     }
     else
     {
         // greater or equal
         nRet = pStr1End - pStr1;
     }

     return nRet;
 }

 /* ----------------------------------------------------------------------- */

 void SAL_CALL rtl_uString_newFromAscii( rtl_uString** ppThis,
                                         const sal_Char* pCharStr )
 {
     sal_Int32 nLen;

     if ( pCharStr )
     {
         const sal_Char* pTempStr = pCharStr;
         while( *pTempStr )
             pTempStr++;
         nLen = pTempStr-pCharStr;
     }
     else
         nLen = 0;

     if ( !nLen )
     {
         IMPL_RTL_STRINGNAME( new )( ppThis );
         return;
     }

     if ( *ppThis )
         IMPL_RTL_STRINGNAME( release )( *ppThis );

     *ppThis = IMPL_RTL_STRINGNAME( ImplAlloc )( nLen );
     OSL_ASSERT(*ppThis != NULL);
     if ( (*ppThis) )
     {
         IMPL_RTL_STRCODE* pBuffer = (*ppThis)->buffer;
         do
         {
             /* Check ASCII range */
             OSL_ENSURE( ((unsigned char)*pCharStr) <= 127,
                         "rtl_uString_newFromAscii() - Found ASCII char > 127" );

             *pBuffer = *pCharStr;
             pBuffer++;
             pCharStr++;
         }
         while ( *pCharStr );
     }
 }

 void SAL_CALL rtl_uString_newFromCodePoints(
     rtl_uString ** newString, sal_uInt32 const * codePoints,
     sal_Int32 codePointCount)
 {
     sal_Int32 n;
     sal_Int32 i;
     sal_Unicode * p;
     OSL_ASSERT(
         newString != NULL &&
         (codePoints != NULL || codePointCount == 0) &&
         codePointCount >= 0);
     if (codePointCount == 0) {
         rtl_uString_new(newString);
         return;
     }
     if (*newString != NULL) {
         rtl_uString_release(*newString);
     }
     n = codePointCount;
     for (i = 0; i < codePointCount; ++i) {
         OSL_ASSERT(codePoints[i] <= 0x10FFFF);
         if (codePoints[i] >= 0x10000) {
             ++n;
         }
     }
     /* Builds on the assumption that sal_Int32 uses 32 bit two's complement
        representation with wrap around (the necessary number of UTF-16 code
        units will be no larger than 2 * SAL_MAX_INT32, represented as
        sal_Int32 -2): */
     if (n < 0) {
         *newString = NULL;
         return;
     }
     *newString = rtl_uString_ImplAlloc(n);
     if (*newString == NULL) {
         return;
     }
     p = (*newString)->buffer;
     for (i = 0; i < codePointCount; ++i) {
         sal_uInt32 c = codePoints[i];
         if (c < 0x10000) {
             *p++ = (sal_Unicode) c;
         } else {
             c -= 0x10000;
             *p++ = (sal_Unicode) ((c >> 10) | SAL_RTL_FIRST_HIGH_SURROGATE);
             *p++ = (sal_Unicode) ((c & 0x3FF) | SAL_RTL_FIRST_LOW_SURROGATE);
         }
     }
 }

 /* ======================================================================= */

 static int rtl_ImplGetFastUTF8UnicodeLen( const sal_Char* pStr, sal_Int32 nLen )
 {
     int             n;
     sal_uChar       c;
     const sal_Char* pEndStr;

     n = 0;
     pEndStr  = pStr+nLen;
     while ( pStr < pEndStr )
     {
         c = (sal_uChar)*pStr;

         if ( !(c & 0x80) )
             pStr++;
         else if ( (c & 0xE0) == 0xC0 )
             pStr += 2;
         else if ( (c & 0xF0) == 0xE0 )
             pStr += 3;
         else if ( (c & 0xF8) == 0xF0 )
             pStr += 4;
         else if ( (c & 0xFC) == 0xF8 )
             pStr += 5;
         else if ( (c & 0xFE) == 0xFC )
             pStr += 6;
         else
             pStr++;

         n++;
     }

     return n;
 }

 /* ----------------------------------------------------------------------- */

 static void rtl_string2UString_status( rtl_uString** ppThis,
                                        const sal_Char* pStr,
                                        sal_Int32 nLen,
                                        rtl_TextEncoding eTextEncoding,
                                        sal_uInt32 nCvtFlags,
                                        sal_uInt32 *pInfo )
 {
     OSL_ENSURE(rtl_isOctetTextEncoding(eTextEncoding),
                "rtl_string2UString_status() - Wrong TextEncoding" );

     if ( !nLen )
     {
         rtl_uString_new( ppThis );
         if (pInfo != NULL) {
             *pInfo = 0;
         }
     }
     else
     {
         if ( *ppThis )
             IMPL_RTL_STRINGNAME( release )( *ppThis );

         /* Optimization for US-ASCII */
         if ( eTextEncoding == RTL_TEXTENCODING_ASCII_US )
         {
             IMPL_RTL_STRCODE* pBuffer;
             *ppThis = IMPL_RTL_STRINGNAME( ImplAlloc )( nLen );
             if (*ppThis == NULL) {
                 if (pInfo != NULL) {
                     *pInfo = RTL_TEXTTOUNICODE_INFO_ERROR |
                         RTL_TEXTTOUNICODE_INFO_DESTBUFFERTOSMALL;
                 }
                 return;
             }
             pBuffer = (*ppThis)->buffer;
             do
             {
                 /* Check ASCII range */
                 OSL_ENSURE( ((unsigned char)*pStr) <= 127,
                             "rtl_string2UString_status() - Found char > 127 and RTL_TEXTENCODING_ASCII_US is specified" );

                 *pBuffer = *pStr;
                 pBuffer++;
                 pStr++;
                 nLen--;
             }
             while ( nLen );
             if (pInfo != NULL) {
                 *pInfo = 0;
             }
         }
         else
         {
             rtl_uString*                pTemp;
             rtl_uString*                pTemp2 = NULL;
             rtl_TextToUnicodeConverter  hConverter;
             sal_uInt32                  nInfo;
             sal_Size                    nSrcBytes;
             sal_Size                    nDestChars;
             sal_Size                    nNewLen;

             /* Optimization for UTF-8 - we try to calculate the exact length */
             /* For all other encoding we try the maximum - and reallocate
                the buffer if needed */
             if ( eTextEncoding == RTL_TEXTENCODING_UTF8 )
             {
                 nNewLen = rtl_ImplGetFastUTF8UnicodeLen( pStr, nLen );
                 /* Includes the string only ASCII, then we could copy
                    the buffer faster */
                 if ( nNewLen == (sal_Size)nLen )
                 {
                     IMPL_RTL_STRCODE* pBuffer;
                     *ppThis = IMPL_RTL_STRINGNAME( ImplAlloc )( nLen );
                     if (*ppThis == NULL)
                     {
                         if (pInfo != NULL) {
                             *pInfo = RTL_TEXTTOUNICODE_INFO_ERROR |
                                 RTL_TEXTTOUNICODE_INFO_DESTBUFFERTOSMALL;
                         }
                         return;
                     }
                     pBuffer = (*ppThis)->buffer;
                     do
                     {
                         /* Check ASCII range */
                         OSL_ENSURE( ((unsigned char)*pStr) <= 127,
                                     "rtl_string2UString_status() - UTF8 test encoding is wrong" );

                         *pBuffer = *pStr;
                         pBuffer++;
                         pStr++;
                         nLen--;
                     }
                     while ( nLen );
                     if (pInfo != NULL) {
                         *pInfo = 0;
                     }
                     return;
                 }
             }
             else
                 nNewLen = nLen;

             nCvtFlags |= RTL_TEXTTOUNICODE_FLAGS_FLUSH;
             hConverter = rtl_createTextToUnicodeConverter( eTextEncoding );

             pTemp = IMPL_RTL_STRINGNAME( ImplAlloc )( nNewLen );
             if (pTemp == NULL) {
                 if (pInfo != NULL) {
                     *pInfo = RTL_TEXTTOUNICODE_INFO_ERROR |
                         RTL_TEXTTOUNICODE_INFO_DESTBUFFERTOSMALL;
                 }
                 return;
             }
             nDestChars = rtl_convertTextToUnicode( hConverter, 0,
                                                    pStr, nLen,
                                                    pTemp->buffer, nNewLen,
                                                    nCvtFlags,
                                                    &nInfo, &nSrcBytes );

             /* Buffer not big enough, try again with enough space */
             /* Shouldn't be the case, but if we get textencoding which
                could results in more unicode characters we have this
                code here. Could be the case for apple encodings */
             while ( nInfo & RTL_TEXTTOUNICODE_INFO_DESTBUFFERTOSMALL )
             {
                 rtl_freeMemory( pTemp );
                 nNewLen += 8;
                 pTemp = IMPL_RTL_STRINGNAME( ImplAlloc )( nNewLen );
                 if (pTemp == NULL) {
                     if (pInfo != NULL) {
                         *pInfo = RTL_TEXTTOUNICODE_INFO_ERROR |
                             RTL_TEXTTOUNICODE_INFO_DESTBUFFERTOSMALL;
                     }
                     return;
                 }
                 nDestChars = rtl_convertTextToUnicode( hConverter, 0,
                                                        pStr, nLen,
                                                        pTemp->buffer, nNewLen,
                                                        nCvtFlags,
                                                        &nInfo, &nSrcBytes );
             }

             if (pInfo)
                 *pInfo = nInfo;

             /* Set the buffer to the correct size or if there is too
                much overhead, reallocate to the correct size */
             if ( nNewLen > nDestChars+8 )
             {
                 pTemp2 = IMPL_RTL_STRINGNAME( ImplAlloc )( nDestChars );
             }
             if (pTemp2 != NULL)
             {
                 rtl_str_ImplCopy(pTemp2->buffer, pTemp->buffer, nDestChars);
                 rtl_freeMemory(pTemp);
                 pTemp = pTemp2;
             }
             else
             {
                 pTemp->length = nDestChars;
                 pTemp->buffer[nDestChars] = 0;
             }

             rtl_destroyTextToUnicodeConverter( hConverter );
             *ppThis = pTemp;

             /* Results the conversion in an empty buffer -
                create an empty string */
             if ( pTemp && !nDestChars )
                 rtl_uString_new( ppThis );
         }
     }
 }

 void SAL_CALL rtl_string2UString( rtl_uString** ppThis,
                                   const sal_Char* pStr,
                                   sal_Int32 nLen,
                                   rtl_TextEncoding eTextEncoding,
                                   sal_uInt32 nCvtFlags )
 {
     rtl_string2UString_status( ppThis, pStr, nLen, eTextEncoding,
                                nCvtFlags, NULL );
 }

 /* ----------------------------------------------------------------------- */

 typedef enum {
     CANNOT_RETURN,
     CAN_RETURN = 1
 } StrLifecycle;

 static oslMutex
 getInternMutex()
 {
     static oslMutex pPoolGuard = NULL;
     if( !pPoolGuard )
     {
         oslMutex pGlobalGuard;
         pGlobalGuard = *osl_getGlobalMutex();
         osl_acquireMutex( pGlobalGuard );
         if( !pPoolGuard )
         {
             oslMutex p = osl_createMutex();
             OSL_DOUBLE_CHECKED_LOCKING_MEMORY_BARRIER();
             pPoolGuard = p;
         }
         osl_releaseMutex( pGlobalGuard );
     }
     else
     {
         OSL_DOUBLE_CHECKED_LOCKING_MEMORY_BARRIER();
     }

     return pPoolGuard;
 }

 /* returns true if we found a dup in the pool */
 static void rtl_ustring_intern_internal( rtl_uString ** newStr,
                                          rtl_uString  * str,
                                          StrLifecycle   can_return )
 {
     oslMutex pPoolMutex;

     pPoolMutex = getInternMutex();

     osl_acquireMutex( pPoolMutex );

     *newStr = rtl_str_hash_intern (str, can_return);

     osl_releaseMutex( pPoolMutex );

     if( can_return && *newStr != str )
     { /* we dupped, then found a match */
         rtl_freeMemory( str );
     }
 }

 void SAL_CALL rtl_uString_intern( rtl_uString ** newStr,
                                   rtl_uString  * str)
 {
     if (SAL_STRING_IS_INTERN(str))
     {
         IMPL_RTL_AQUIRE( str );
         *newStr = str;
     }
     else
     {
         rtl_uString *pOrg = *newStr;
         *newStr = NULL;
         rtl_ustring_intern_internal( newStr, str, CANNOT_RETURN );
         if (pOrg)
             rtl_uString_release (pOrg);
     }
 }

 void SAL_CALL rtl_uString_internConvert( rtl_uString   ** newStr,
                                          const sal_Char * str,
                                          sal_Int32        len,
                                          rtl_TextEncoding eTextEncoding,
                                          sal_uInt32       convertFlags,
                                          sal_uInt32     * pInfo )
 {
     rtl_uString *scratch;

     if (*newStr)
     {
         rtl_uString_release (*newStr);
         *newStr = NULL;
     }

     if ( len < 256 )
     { // try various optimisations
         if ( len < 0 )
             len = strlen( str );
         if ( eTextEncoding == RTL_TEXTENCODING_ASCII_US )
         {
             int i;
             rtl_uString *pScratch;
             pScratch = alloca( sizeof( rtl_uString )
                                + len * sizeof (IMPL_RTL_STRCODE ) );
             for (i = 0; i < len; i++)
             {
                 /* Check ASCII range */
                 OSL_ENSURE( ((unsigned char)str[i]) <= 127,
                             "rtl_ustring_internConvert() - Found char > 127 and RTL_TEXTENCODING_ASCII_US is specified" );
                 pScratch->buffer[i] = str[i];
             }
             pScratch->length = len;
             rtl_ustring_intern_internal( newStr, pScratch, CANNOT_RETURN );
             return;
         }
         /* FIXME: we want a nice UTF-8 / alloca shortcut here */
     }

     scratch = NULL;
     rtl_string2UString_status( &scratch, str, len, eTextEncoding, convertFlags,
                                pInfo );
     if (!scratch) {
         return;
     }
     rtl_ustring_intern_internal( newStr, scratch, CAN_RETURN );
 }

 static void
 internRelease (rtl_uString *pThis)
 {
     oslMutex pPoolMutex;

     rtl_uString *pFree = NULL;
     if ( SAL_STRING_REFCOUNT(
              osl_decrementInterlockedCount( &(pThis->refCount) ) ) == 0)
     {
         pPoolMutex = getInternMutex();
         osl_acquireMutex( pPoolMutex );

         rtl_str_hash_remove (pThis);

         /* May have been separately acquired */
         if ( SAL_STRING_REFCOUNT(
                  osl_incrementInterlockedCount( &(pThis->refCount) ) ) == 1 )
         {
             /* we got the last ref */
             pFree = pThis;
         }
         else /* very unusual */
         {
             internRelease (pThis);
         }

         osl_releaseMutex( pPoolMutex );
     }
     if (pFree)
         rtl_freeMemory (pFree);
 }

 sal_uInt32 SAL_CALL rtl_uString_iterateCodePoints(
     rtl_uString const * string, sal_Int32 * indexUtf16,
     sal_Int32 incrementCodePoints)
 {
     sal_Int32 n;
     sal_Unicode cu;
     sal_uInt32 cp;
     OSL_ASSERT(string != NULL && indexUtf16 != NULL);
     n = *indexUtf16;
     OSL_ASSERT(n >= 0 && n <= string->length);
     while (incrementCodePoints < 0) {
         OSL_ASSERT(n > 0);
         cu = string->buffer[--n];
         if (SAL_RTL_IS_LOW_SURROGATE(cu) && n != 0 &&
             SAL_RTL_IS_HIGH_SURROGATE(string->buffer[n - 1]))
         {
             --n;
         }
         ++incrementCodePoints;
     }
     OSL_ASSERT(n >= 0 && n < string->length);
     cu = string->buffer[n];
     if (SAL_RTL_IS_HIGH_SURROGATE(cu) && string->length - n >= 2 &&
         SAL_RTL_IS_LOW_SURROGATE(string->buffer[n + 1]))
     {
         cp = SAL_RTL_COMBINE_SURROGATES(cu, string->buffer[n + 1]);
     } else {
         cp = cu;
     }
     while (incrementCodePoints > 0) {
         OSL_ASSERT(n < string->length);
         cu = string->buffer[n++];
         if (SAL_RTL_IS_HIGH_SURROGATE(cu) && n != string->length &&
             SAL_RTL_IS_LOW_SURROGATE(string->buffer[n]))
         {
             ++n;
         }
         --incrementCodePoints;
     }
     OSL_ASSERT(n >= 0 && n <= string->length);
     *indexUtf16 = n;
     return cp;
 }

 sal_Bool rtl_convertStringToUString(
     rtl_uString ** target, char const * source, sal_Int32 length,
     rtl_TextEncoding encoding, sal_uInt32 flags) SAL_THROW_EXTERN_C()
 {
     sal_uInt32 info;
     rtl_string2UString_status(target, source, length, encoding, flags, &info);
     return (sal_Bool) ((info & RTL_TEXTTOUNICODE_INFO_ERROR) == 0);
 }
	/**************************************************************
	*
	* Licensed to the Apache Software Foundation (ASF) under one
	* or more contributor license agreements. See the NOTICE file
	* distributed with this work for additional information
	* regarding copyright ownership. The ASF licenses this file
	* to you under the Apache License, Version 2.0 (the
	* "License"); you may not use this file except in compliance
	* with the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing,
	* software distributed under the License is distributed on an
	* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
	* KIND, either express or implied. See the License for the
	* specific language governing permissions and limitations
	* under the License.
	*
	*************************************************************/


	#if defined(_MSC_VER) && (_MSC_VER >= 1400)
	#pragma warning(disable:4738) // storing 32-bit float result in memory, possible loss of performance
	#endif

	#include <rtl/memory.h>
	#include <osl/diagnose.h>
	#include <osl/interlck.h>
	#include <rtl/alloc.h>
	#include <osl/mutex.h>
	#include <osl/doublecheckedlocking.h>
	#include <rtl/tencinfo.h>

	#include <string.h>
	#include <sal/alloca.h>

	#include "hash.h"
	#include "strimp.h"
	#include "surrogates.h"
	#include <rtl/ustring.h>

	#include "rtl/math.h"
	#include "rtl/tencinfo.h"

	/* ======================================================================= */

	/* static data to be referenced by all empty strings
	* the refCount is predefined to 1 and must never become 0 !
	*/
	static rtl_uString const aImplEmpty_rtl_uString =
	{
	(sal_Int32) (SAL_STRING_INTERN_FLAG\|SAL_STRING_STATIC_FLAG\|1), /sal_Int32 refCount; /
	0, /sal_Int32 length; /
	{ 0 } /sal_Unicode buffer[1];/
	};

	/* ======================================================================= */

	#define IMPL_RTL_STRCODE sal_Unicode
	#define IMPL_RTL_USTRCODE( c ) (c)
	#define IMPL_RTL_STRNAME( n ) rtl_ustr_ ## n

	#define IMPL_RTL_STRINGNAME( n ) rtl_uString_ ## n
	#define IMPL_RTL_STRINGDATA rtl_uString
	#define IMPL_RTL_EMPTYSTRING aImplEmpty_rtl_uString
	#define IMPL_RTL_INTERN
	static void internRelease (rtl_uString *pThis);

	/* ======================================================================= */

	/* Include String/UString template code */

	#include "strtmpl.c"

	sal_Int32 rtl_ustr_indexOfAscii_WithLength(
	sal_Unicode const * str, sal_Int32 len,
	char const * subStr, sal_Int32 subLen)
	{
	if (subLen > 0 && subLen <= len) {
	sal_Int32 i;
	for (i = 0; i <= len - subLen; ++i) {
	if (rtl_ustr_asciil_reverseEquals_WithLength(
	str + i, subStr, subLen))
	{
	return i;
	}
	}
	}
	return -1;
	}

	sal_Int32 rtl_ustr_lastIndexOfAscii_WithLength(
	sal_Unicode const * str, sal_Int32 len,
	char const * subStr, sal_Int32 subLen)
	{
	if (subLen > 0 && subLen <= len) {
	sal_Int32 i;
	for (i = len - subLen; i >= 0; --i) {
	if (rtl_ustr_asciil_reverseEquals_WithLength(
	str + i, subStr, subLen))
	{
	return i;
	}
	}
	}
	return -1;
	}

	sal_Int32 SAL_CALL rtl_ustr_valueOfFloat(sal_Unicode * pStr, float f)
	{
	rtl_uString * pResult = NULL;
	sal_Int32 nLen;
	rtl_math_doubleToUString(
	&pResult, 0, 0, f, rtl_math_StringFormat_G,
	RTL_USTR_MAX_VALUEOFFLOAT - RTL_CONSTASCII_LENGTH("-x.E-xxx"), '.', 0,
	0, sal_True);
	nLen = pResult->length;
	OSL_ASSERT(nLen < RTL_USTR_MAX_VALUEOFFLOAT);
	rtl_copyMemory(pStr, pResult->buffer, (nLen + 1) * sizeof(sal_Unicode));
	rtl_uString_release(pResult);
	return nLen;
	}

	sal_Int32 SAL_CALL rtl_ustr_valueOfDouble(sal_Unicode * pStr, double d)
	{
	rtl_uString * pResult = NULL;
	sal_Int32 nLen;
	rtl_math_doubleToUString(
	&pResult, 0, 0, d, rtl_math_StringFormat_G,
	RTL_USTR_MAX_VALUEOFDOUBLE - RTL_CONSTASCII_LENGTH("-x.E-xxx"), '.', 0,
	0, sal_True);
	nLen = pResult->length;
	OSL_ASSERT(nLen < RTL_USTR_MAX_VALUEOFDOUBLE);
	rtl_copyMemory(pStr, pResult->buffer, (nLen + 1) * sizeof(sal_Unicode));
	rtl_uString_release(pResult);
	return nLen;
	}

	float SAL_CALL rtl_ustr_toFloat(sal_Unicode const * pStr)
	{
	return (float) rtl_math_uStringToDouble(pStr,
	pStr + rtl_ustr_getLength(pStr),
	'.', 0, 0, 0);
	}

	double SAL_CALL rtl_ustr_toDouble(sal_Unicode const * pStr)
	{
	return rtl_math_uStringToDouble(pStr, pStr + rtl_ustr_getLength(pStr), '.',
	0, 0, 0);
	}

	/* ======================================================================= */

	sal_Int32 SAL_CALL rtl_ustr_ascii_compare( const sal_Unicode* pStr1,
	const sal_Char* pStr2 )
	{
	sal_Int32 nRet;
	while ( ((nRet = ((sal_Int32)(*pStr1))-
	((sal_Int32)((unsigned char)(*pStr2)))) == 0) &&
	*pStr2 )
	{
	pStr1++;
	pStr2++;
	}

	return nRet;
	}

	/* ----------------------------------------------------------------------- */

	sal_Int32 SAL_CALL rtl_ustr_ascii_compare_WithLength( const sal_Unicode* pStr1,
	sal_Int32 nStr1Len,
	const sal_Char* pStr2 )
	{
	sal_Int32 nRet = 0;
	while( ((nRet = (nStr1Len ? (sal_Int32)(*pStr1) : 0)-
	((sal_Int32)((unsigned char)(*pStr2)))) == 0) &&
	nStr1Len && *pStr2 )
	{
	pStr1++;
	pStr2++;
	nStr1Len--;
	}

	return nRet;
	}

	/* ----------------------------------------------------------------------- */

	sal_Int32 SAL_CALL rtl_ustr_ascii_shortenedCompare_WithLength( const sal_Unicode* pStr1,
	sal_Int32 nStr1Len,
	const sal_Char* pStr2,
	sal_Int32 nShortenedLength )
	{
	const sal_Unicode* pStr1End = pStr1 + nStr1Len;
	sal_Int32 nRet;
	while ( (nShortenedLength > 0) &&
	(pStr1 < pStr1End) && *pStr2 )
	{
	/* Check ASCII range */
	OSL_ENSURE( (*pStr2 & 0x80) == 0, "Found ASCII char > 127");

	nRet = ((sal_Int32)*pStr1)-
	((sal_Int32)(unsigned char)*pStr2);
	if ( nRet != 0 )
	return nRet;

	nShortenedLength--;
	pStr1++;
	pStr2++;
	}

	if ( nShortenedLength <= 0 )
	return 0;

	if ( *pStr2 )
	{
	OSL_ENSURE( pStr1 == pStr1End, "pStr1 == pStr1End failed" );
	// first is a substring of the second string => less (negative value)
	nRet = -1;
	}
	else
	{
	// greater or equal
	nRet = pStr1End - pStr1;
	}

	return nRet;
	}

	/* ----------------------------------------------------------------------- */

	sal_Int32 SAL_CALL rtl_ustr_asciil_reverseCompare_WithLength( const sal_Unicode* pStr1,
	sal_Int32 nStr1Len,
	const sal_Char* pStr2,
	sal_Int32 nStr2Len )
	{
	const sal_Unicode* pStr1Run = pStr1+nStr1Len;
	const sal_Char* pStr2Run = pStr2+nStr2Len;
	sal_Int32 nRet;
	while ( (pStr1 < pStr1Run) && (pStr2 < pStr2Run) )
	{
	pStr1Run--;
	pStr2Run--;
	nRet = ((sal_Int32)pStr1Run)-((sal_Int32)pStr2Run);
	if ( nRet )
	return nRet;
	}

	return nStr1Len - nStr2Len;
	}

	/* ----------------------------------------------------------------------- */

	sal_Bool SAL_CALL rtl_ustr_asciil_reverseEquals_WithLength( const sal_Unicode* pStr1,
	const sal_Char* pStr2,
	sal_Int32 nStrLen )
	{
	const sal_Unicode* pStr1Run = pStr1+nStrLen;
	const sal_Char* pStr2Run = pStr2+nStrLen;
	while ( pStr1 < pStr1Run )
	{
	pStr1Run--;
	pStr2Run--;
	if( pStr1Run != (sal_Unicode)pStr2Run )
	return sal_False;
	}

	return sal_True;
	}

	/* ----------------------------------------------------------------------- */

	sal_Int32 SAL_CALL rtl_ustr_ascii_compareIgnoreAsciiCase( const sal_Unicode* pStr1,
	const sal_Char* pStr2 )
	{
	sal_Int32 nRet;
	sal_Int32 c1;
	sal_Int32 c2;
	do
	{
	/* If character between 'A' and 'Z', than convert it to lowercase */
	c1 = (sal_Int32)*pStr1;
	c2 = (sal_Int32)((unsigned char)*pStr2);
	if ( (c1 >= 65) && (c1 <= 90) )
	c1 += 32;
	if ( (c2 >= 65) && (c2 <= 90) )
	c2 += 32;
	nRet = c1-c2;
	if ( nRet != 0 )
	return nRet;

	pStr1++;
	pStr2++;
	}
	while ( c2 );

	return 0;
	}

	/* ----------------------------------------------------------------------- */

	sal_Int32 SAL_CALL rtl_ustr_ascii_compareIgnoreAsciiCase_WithLength( const sal_Unicode* pStr1,
	sal_Int32 nStr1Len,
	const sal_Char* pStr2 )
	{
	sal_Int32 nRet;
	sal_Int32 c1;
	sal_Int32 c2;
	do
	{
	if ( !nStr1Len )
	return *pStr2 == '\0' ? 0 : -1;

	/* If character between 'A' and 'Z', than convert it to lowercase */
	c1 = (sal_Int32)*pStr1;
	c2 = (sal_Int32)((unsigned char)*pStr2);
	if ( (c1 >= 65) && (c1 <= 90) )
	c1 += 32;
	if ( (c2 >= 65) && (c2 <= 90) )
	c2 += 32;
	nRet = c1-c2;
	if ( nRet != 0 )
	return nRet;

	pStr1++;
	pStr2++;
	nStr1Len--;
	}
	while( c2 );

	return 0;
	}

	sal_Int32 rtl_ustr_ascii_compareIgnoreAsciiCase_WithLengths(
	sal_Unicode const * first, sal_Int32 firstLen,
	char const * second, sal_Int32 secondLen)
	{
	sal_Int32 i;
	sal_Int32 len = firstLen < secondLen ? firstLen : secondLen;
	for (i = 0; i < len; ++i) {
	sal_Int32 c1 = *first++;
	sal_Int32 c2 = (unsigned char) *second++;
	sal_Int32 d;
	if (c1 >= 65 && c1 <= 90) {
	c1 += 32;
	}
	if (c2 >= 65 && c2 <= 90) {
	c2 += 32;
	}
	d = c1 - c2;
	if (d != 0) {
	return d;
	}
	}
	return firstLen - secondLen;
	}

	/* ----------------------------------------------------------------------- */

	sal_Int32 SAL_CALL rtl_ustr_ascii_shortenedCompareIgnoreAsciiCase_WithLength( const sal_Unicode* pStr1,
	sal_Int32 nStr1Len,
	const sal_Char* pStr2,
	sal_Int32 nShortenedLength )
	{
	const sal_Unicode* pStr1End = pStr1 + nStr1Len;
	sal_Int32 nRet;
	sal_Int32 c1;
	sal_Int32 c2;
	while ( (nShortenedLength > 0) &&
	(pStr1 < pStr1End) && *pStr2 )
	{
	/* Check ASCII range */
	OSL_ENSURE( (*pStr2 & 0x80) == 0, "Found ASCII char > 127");

	/* If character between 'A' and 'Z', than convert it to lowercase */
	c1 = (sal_Int32)*pStr1;
	c2 = (sal_Int32)((unsigned char)*pStr2);
	if ( (c1 >= 65) && (c1 <= 90) )
	c1 += 32;
	if ( (c2 >= 65) && (c2 <= 90) )
	c2 += 32;
	nRet = c1-c2;
	if ( nRet != 0 )
	return nRet;

	nShortenedLength--;
	pStr1++;
	pStr2++;
	}

	if ( nShortenedLength <= 0 )
	return 0;

	if ( *pStr2 )
	{
	OSL_ENSURE( pStr1 == pStr1End, "pStr1 == pStr1End failed" );
	// first is a substring of the second string => less (negative value)
	nRet = -1;
	}
	else
	{
	// greater or equal
	nRet = pStr1End - pStr1;
	}

	return nRet;
	}

	/* ----------------------------------------------------------------------- */

	void SAL_CALL rtl_uString_newFromAscii( rtl_uString** ppThis,
	const sal_Char* pCharStr )
	{
	sal_Int32 nLen;

	if ( pCharStr )
	{
	const sal_Char* pTempStr = pCharStr;
	while( *pTempStr )
	pTempStr++;
	nLen = pTempStr-pCharStr;
	}
	else
	nLen = 0;

	if ( !nLen )
	{
	IMPL_RTL_STRINGNAME( new )( ppThis );
	return;
	}

	if ( *ppThis )
	IMPL_RTL_STRINGNAME( release )( *ppThis );

	*ppThis = IMPL_RTL_STRINGNAME( ImplAlloc )( nLen );
	OSL_ASSERT(*ppThis != NULL);
	if ( (*ppThis) )
	{
	IMPL_RTL_STRCODE* pBuffer = (*ppThis)->buffer;
	do
	{
	/* Check ASCII range */
	OSL_ENSURE( ((unsigned char)*pCharStr) <= 127,
	"rtl_uString_newFromAscii() - Found ASCII char > 127" );

	pBuffer = pCharStr;
	pBuffer++;
	pCharStr++;
	}
	while ( *pCharStr );
	}
	}

	void SAL_CALL rtl_uString_newFromCodePoints(
	rtl_uString ** newString, sal_uInt32 const * codePoints,
	sal_Int32 codePointCount)
	{
	sal_Int32 n;
	sal_Int32 i;
	sal_Unicode * p;
	OSL_ASSERT(
	newString != NULL &&
	(codePoints != NULL \|\| codePointCount == 0) &&
	codePointCount >= 0);
	if (codePointCount == 0) {
	rtl_uString_new(newString);
	return;
	}
	if (*newString != NULL) {
	rtl_uString_release(*newString);
	}
	n = codePointCount;
	for (i = 0; i < codePointCount; ++i) {
	OSL_ASSERT(codePoints[i] <= 0x10FFFF);
	if (codePoints[i] >= 0x10000) {
	++n;
	}
	}
	/* Builds on the assumption that sal_Int32 uses 32 bit two's complement
	representation with wrap around (the necessary number of UTF-16 code
	units will be no larger than 2 * SAL_MAX_INT32, represented as
	sal_Int32 -2): */
	if (n < 0) {
	*newString = NULL;
	return;
	}
	*newString = rtl_uString_ImplAlloc(n);
	if (*newString == NULL) {
	return;
	}
	p = (*newString)->buffer;
	for (i = 0; i < codePointCount; ++i) {
	sal_uInt32 c = codePoints[i];
	if (c < 0x10000) {
	*p++ = (sal_Unicode) c;
	} else {
	c -= 0x10000;
	*p++ = (sal_Unicode) ((c >> 10) \| SAL_RTL_FIRST_HIGH_SURROGATE);
	*p++ = (sal_Unicode) ((c & 0x3FF) \| SAL_RTL_FIRST_LOW_SURROGATE);
	}
	}
	}

	/* ======================================================================= */

	static int rtl_ImplGetFastUTF8UnicodeLen( const sal_Char* pStr, sal_Int32 nLen )
	{
	int n;
	sal_uChar c;
	const sal_Char* pEndStr;

	n = 0;
	pEndStr = pStr+nLen;
	while ( pStr < pEndStr )
	{
	c = (sal_uChar)*pStr;

	if ( !(c & 0x80) )
	pStr++;
	else if ( (c & 0xE0) == 0xC0 )
	pStr += 2;
	else if ( (c & 0xF0) == 0xE0 )
	pStr += 3;
	else if ( (c & 0xF8) == 0xF0 )
	pStr += 4;
	else if ( (c & 0xFC) == 0xF8 )
	pStr += 5;
	else if ( (c & 0xFE) == 0xFC )
	pStr += 6;
	else
	pStr++;

	n++;
	}

	return n;
	}

	/* ----------------------------------------------------------------------- */

	static void rtl_string2UString_status( rtl_uString** ppThis,
	const sal_Char* pStr,
	sal_Int32 nLen,
	rtl_TextEncoding eTextEncoding,
	sal_uInt32 nCvtFlags,
	sal_uInt32 *pInfo )
	{
	OSL_ENSURE(rtl_isOctetTextEncoding(eTextEncoding),
	"rtl_string2UString_status() - Wrong TextEncoding" );

	if ( !nLen )
	{
	rtl_uString_new( ppThis );
	if (pInfo != NULL) {
	*pInfo = 0;
	}
	}
	else
	{
	if ( *ppThis )
	IMPL_RTL_STRINGNAME( release )( *ppThis );

	/* Optimization for US-ASCII */
	if ( eTextEncoding == RTL_TEXTENCODING_ASCII_US )
	{
	IMPL_RTL_STRCODE* pBuffer;
	*ppThis = IMPL_RTL_STRINGNAME( ImplAlloc )( nLen );
	if (*ppThis == NULL) {
	if (pInfo != NULL) {
	*pInfo = RTL_TEXTTOUNICODE_INFO_ERROR \|
	RTL_TEXTTOUNICODE_INFO_DESTBUFFERTOSMALL;
	}
	return;
	}
	pBuffer = (*ppThis)->buffer;
	do
	{
	/* Check ASCII range */
	OSL_ENSURE( ((unsigned char)*pStr) <= 127,
	"rtl_string2UString_status() - Found char > 127 and RTL_TEXTENCODING_ASCII_US is specified" );

	pBuffer = pStr;
	pBuffer++;
	pStr++;
	nLen--;
	}
	while ( nLen );
	if (pInfo != NULL) {
	*pInfo = 0;
	}
	}
	else
	{
	rtl_uString* pTemp;
	rtl_uString* pTemp2 = NULL;
	rtl_TextToUnicodeConverter hConverter;
	sal_uInt32 nInfo;
	sal_Size nSrcBytes;
	sal_Size nDestChars;
	sal_Size nNewLen;

	/* Optimization for UTF-8 - we try to calculate the exact length */
	/* For all other encoding we try the maximum - and reallocate
	the buffer if needed */
	if ( eTextEncoding == RTL_TEXTENCODING_UTF8 )
	{
	nNewLen = rtl_ImplGetFastUTF8UnicodeLen( pStr, nLen );
	/* Includes the string only ASCII, then we could copy
	the buffer faster */
	if ( nNewLen == (sal_Size)nLen )
	{
	IMPL_RTL_STRCODE* pBuffer;
	*ppThis = IMPL_RTL_STRINGNAME( ImplAlloc )( nLen );
	if (*ppThis == NULL)
	{
	if (pInfo != NULL) {
	*pInfo = RTL_TEXTTOUNICODE_INFO_ERROR \|
	RTL_TEXTTOUNICODE_INFO_DESTBUFFERTOSMALL;
	}
	return;
	}
	pBuffer = (*ppThis)->buffer;
	do
	{
	/* Check ASCII range */
	OSL_ENSURE( ((unsigned char)*pStr) <= 127,
	"rtl_string2UString_status() - UTF8 test encoding is wrong" );

	pBuffer = pStr;
	pBuffer++;
	pStr++;
	nLen--;
	}
	while ( nLen );
	if (pInfo != NULL) {
	*pInfo = 0;
	}
	return;
	}
	}
	else
	nNewLen = nLen;

	nCvtFlags \|= RTL_TEXTTOUNICODE_FLAGS_FLUSH;
	hConverter = rtl_createTextToUnicodeConverter( eTextEncoding );

	pTemp = IMPL_RTL_STRINGNAME( ImplAlloc )( nNewLen );
	if (pTemp == NULL) {
	if (pInfo != NULL) {
	*pInfo = RTL_TEXTTOUNICODE_INFO_ERROR \|
	RTL_TEXTTOUNICODE_INFO_DESTBUFFERTOSMALL;
	}
	return;
	}
	nDestChars = rtl_convertTextToUnicode( hConverter, 0,
	pStr, nLen,
	pTemp->buffer, nNewLen,
	nCvtFlags,
	&nInfo, &nSrcBytes );

	/* Buffer not big enough, try again with enough space */
	/* Shouldn't be the case, but if we get textencoding which
	could results in more unicode characters we have this
	code here. Could be the case for apple encodings */
	while ( nInfo & RTL_TEXTTOUNICODE_INFO_DESTBUFFERTOSMALL )
	{
	rtl_freeMemory( pTemp );
	nNewLen += 8;
	pTemp = IMPL_RTL_STRINGNAME( ImplAlloc )( nNewLen );
	if (pTemp == NULL) {
	if (pInfo != NULL) {
	*pInfo = RTL_TEXTTOUNICODE_INFO_ERROR \|
	RTL_TEXTTOUNICODE_INFO_DESTBUFFERTOSMALL;
	}
	return;
	}
	nDestChars = rtl_convertTextToUnicode( hConverter, 0,
	pStr, nLen,
	pTemp->buffer, nNewLen,
	nCvtFlags,
	&nInfo, &nSrcBytes );
	}

	if (pInfo)
	*pInfo = nInfo;

	/* Set the buffer to the correct size or if there is too
	much overhead, reallocate to the correct size */
	if ( nNewLen > nDestChars+8 )
	{
	pTemp2 = IMPL_RTL_STRINGNAME( ImplAlloc )( nDestChars );
	}
	if (pTemp2 != NULL)
	{
	rtl_str_ImplCopy(pTemp2->buffer, pTemp->buffer, nDestChars);
	rtl_freeMemory(pTemp);
	pTemp = pTemp2;
	}
	else
	{
	pTemp->length = nDestChars;
	pTemp->buffer[nDestChars] = 0;
	}

	rtl_destroyTextToUnicodeConverter( hConverter );
	*ppThis = pTemp;

	/* Results the conversion in an empty buffer -
	create an empty string */
	if ( pTemp && !nDestChars )
	rtl_uString_new( ppThis );
	}
	}
	}

	void SAL_CALL rtl_string2UString( rtl_uString** ppThis,
	const sal_Char* pStr,
	sal_Int32 nLen,
	rtl_TextEncoding eTextEncoding,
	sal_uInt32 nCvtFlags )
	{
	rtl_string2UString_status( ppThis, pStr, nLen, eTextEncoding,
	nCvtFlags, NULL );
	}

	/* ----------------------------------------------------------------------- */

	typedef enum {
	CANNOT_RETURN,
	CAN_RETURN = 1
	} StrLifecycle;

	static oslMutex
	getInternMutex()
	{
	static oslMutex pPoolGuard = NULL;
	if( !pPoolGuard )
	{
	oslMutex pGlobalGuard;
	pGlobalGuard = *osl_getGlobalMutex();
	osl_acquireMutex( pGlobalGuard );
	if( !pPoolGuard )
	{
	oslMutex p = osl_createMutex();
	OSL_DOUBLE_CHECKED_LOCKING_MEMORY_BARRIER();
	pPoolGuard = p;
	}
	osl_releaseMutex( pGlobalGuard );
	}
	else
	{
	OSL_DOUBLE_CHECKED_LOCKING_MEMORY_BARRIER();
	}

	return pPoolGuard;
	}

	/* returns true if we found a dup in the pool */
	static void rtl_ustring_intern_internal( rtl_uString ** newStr,
	rtl_uString * str,
	StrLifecycle can_return )
	{
	oslMutex pPoolMutex;

	pPoolMutex = getInternMutex();

	osl_acquireMutex( pPoolMutex );

	*newStr = rtl_str_hash_intern (str, can_return);

	osl_releaseMutex( pPoolMutex );

	if( can_return && *newStr != str )
	{ /* we dupped, then found a match */
	rtl_freeMemory( str );
	}
	}

	void SAL_CALL rtl_uString_intern( rtl_uString ** newStr,
	rtl_uString * str)
	{
	if (SAL_STRING_IS_INTERN(str))
	{
	IMPL_RTL_AQUIRE( str );
	*newStr = str;
	}
	else
	{
	rtl_uString pOrg = newStr;
	*newStr = NULL;
	rtl_ustring_intern_internal( newStr, str, CANNOT_RETURN );
	if (pOrg)
	rtl_uString_release (pOrg);
	}
	}

	void SAL_CALL rtl_uString_internConvert( rtl_uString ** newStr,
	const sal_Char * str,
	sal_Int32 len,
	rtl_TextEncoding eTextEncoding,
	sal_uInt32 convertFlags,
	sal_uInt32 * pInfo )
	{
	rtl_uString *scratch;

	if (*newStr)
	{
	rtl_uString_release (*newStr);
	*newStr = NULL;
	}

	if ( len < 256 )
	{ // try various optimisations
	if ( len < 0 )
	len = strlen( str );
	if ( eTextEncoding == RTL_TEXTENCODING_ASCII_US )
	{
	int i;
	rtl_uString *pScratch;
	pScratch = alloca( sizeof( rtl_uString )
	+ len * sizeof (IMPL_RTL_STRCODE ) );
	for (i = 0; i < len; i++)
	{
	/* Check ASCII range */
	OSL_ENSURE( ((unsigned char)str[i]) <= 127,
	"rtl_ustring_internConvert() - Found char > 127 and RTL_TEXTENCODING_ASCII_US is specified" );
	pScratch->buffer[i] = str[i];
	}
	pScratch->length = len;
	rtl_ustring_intern_internal( newStr, pScratch, CANNOT_RETURN );
	return;
	}
	/* FIXME: we want a nice UTF-8 / alloca shortcut here */
	}

	scratch = NULL;
	rtl_string2UString_status( &scratch, str, len, eTextEncoding, convertFlags,
	pInfo );
	if (!scratch) {
	return;
	}
	rtl_ustring_intern_internal( newStr, scratch, CAN_RETURN );
	}

	static void
	internRelease (rtl_uString *pThis)
	{
	oslMutex pPoolMutex;

	rtl_uString *pFree = NULL;
	if ( SAL_STRING_REFCOUNT(
	osl_decrementInterlockedCount( &(pThis->refCount) ) ) == 0)
	{
	pPoolMutex = getInternMutex();
	osl_acquireMutex( pPoolMutex );

	rtl_str_hash_remove (pThis);

	/* May have been separately acquired */
	if ( SAL_STRING_REFCOUNT(
	osl_incrementInterlockedCount( &(pThis->refCount) ) ) == 1 )
	{
	/* we got the last ref */
	pFree = pThis;
	}
	else /* very unusual */
	{
	internRelease (pThis);
	}

	osl_releaseMutex( pPoolMutex );
	}
	if (pFree)
	rtl_freeMemory (pFree);
	}

	sal_uInt32 SAL_CALL rtl_uString_iterateCodePoints(
	rtl_uString const * string, sal_Int32 * indexUtf16,
	sal_Int32 incrementCodePoints)
	{
	sal_Int32 n;
	sal_Unicode cu;
	sal_uInt32 cp;
	OSL_ASSERT(string != NULL && indexUtf16 != NULL);
	n = *indexUtf16;
	OSL_ASSERT(n >= 0 && n <= string->length);
	while (incrementCodePoints < 0) {
	OSL_ASSERT(n > 0);
	cu = string->buffer[--n];
	if (SAL_RTL_IS_LOW_SURROGATE(cu) && n != 0 &&
	SAL_RTL_IS_HIGH_SURROGATE(string->buffer[n - 1]))
	{
	--n;
	}
	++incrementCodePoints;
	}
	OSL_ASSERT(n >= 0 && n < string->length);
	cu = string->buffer[n];
	if (SAL_RTL_IS_HIGH_SURROGATE(cu) && string->length - n >= 2 &&
	SAL_RTL_IS_LOW_SURROGATE(string->buffer[n + 1]))
	{
	cp = SAL_RTL_COMBINE_SURROGATES(cu, string->buffer[n + 1]);
	} else {
	cp = cu;
	}
	while (incrementCodePoints > 0) {
	OSL_ASSERT(n < string->length);
	cu = string->buffer[n++];
	if (SAL_RTL_IS_HIGH_SURROGATE(cu) && n != string->length &&
	SAL_RTL_IS_LOW_SURROGATE(string->buffer[n]))
	{
	++n;
	}
	--incrementCodePoints;
	}
	OSL_ASSERT(n >= 0 && n <= string->length);
	*indexUtf16 = n;
	return cp;
	}

	sal_Bool rtl_convertStringToUString(
	rtl_uString ** target, char const * source, sal_Int32 length,
	rtl_TextEncoding encoding, sal_uInt32 flags) SAL_THROW_EXTERN_C()
	{
	sal_uInt32 info;
	rtl_string2UString_status(target, source, length, encoding, flags, &info);
	return (sal_Bool) ((info & RTL_TEXTTOUNICODE_INFO_ERROR) == 0);
	}