blob: 36ce3aa2e2564296ee522bd8ee54d81d9af49e23 [file] [log] [blame]
/*
* The Apache Software License, Version 1.1
*
* Copyright (c) 2001 The Apache Software Foundation. All rights
* reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
*
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
*
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in
* the documentation and/or other materials provided with the
* distribution.
*
* 3. The end-user documentation included with the redistribution,
* if any, must include the following acknowledgment:
* "This product includes software developed by the
* Apache Software Foundation (http://www.apache.org/)."
* Alternately, this acknowledgment may appear in the software itself,
* if and wherever such third-party acknowledgments normally appear.
*
* 4. The names "Xerces" and "Apache Software Foundation" must
* not be used to endorse or promote products derived from this
* software without prior written permission. For written
* permission, please contact apache\@apache.org.
*
* 5. Products derived from this software may not be called "Apache",
* nor may "Apache" appear in their name, without prior written
* permission of the Apache Software Foundation.
*
* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
* DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
* ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
* USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
* ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
* OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
* ====================================================================
*
* This software consists of voluntary contributions made by many
* individuals on behalf of the Apache Software Foundation, and was
* originally based on software copyright (c) 1999, International
* Business Machines, Inc., http://www.ibm.com . For more information
* on the Apache Software Foundation, please see
* <http://www.apache.org/>.
*/
/*
* $Id$
*/
// ---------------------------------------------------------------------------
// Includes
// ---------------------------------------------------------------------------
#include <xercesc/util/PlatformUtils.hpp>
#include <xercesc/util/Janitor.hpp>
#include <xercesc/util/NumberFormatException.hpp>
#include <xercesc/util/XMLUri.hpp>
#include <xercesc/util/XMLString.hpp>
#include <xercesc/util/XMLUniDefs.hpp>
#include <xercesc/util/XMLUni.hpp>
// ---------------------------------------------------------------------------
// XMLUri: static data
// ---------------------------------------------------------------------------
// Amended by RFC2732
// reserved = ";" | "/" | "?" | ":" | "@" | "&" | "=" | "+" |
// "$" | "," | "[" | "]"
//
const XMLCh XMLUri::RESERVED_CHARACTERS[] =
{
chSemiColon, chForwardSlash, chQuestion, chColon, chAt,
chAmpersand, chEqual, chPlus, chDollarSign, chComma, chNull
};
//
// mark = "-" | "_" | "." | "!" | "~" | "*" | "'" |
// "(" | ")"
//
const XMLCh XMLUri::MARK_CHARACTERS[] =
{
chDash, chUnderscore, chPeriod, chBang, chTilde,
chAsterisk, chSingleQuote, chOpenParen, chCloseParen, chNull
};
//
// scheme = alpha *( alpha | digit | "+" | "-" | "." )
//
const XMLCh XMLUri::SCHEME_CHARACTERS[] =
{
chPlus, chDash, chPeriod, chNull
};
//
// userinfo = *( unreserved | escaped |
// ";" | ":" | "&" | "=" | "+" | "$" | "," )
//
const XMLCh XMLUri::USERINFO_CHARACTERS[] =
{
chSemiColon, chColon, chAmpersand, chEqual, chPlus,
chDollarSign, chPeriod, chNull
};
// ---------------------------------------------------------------------------
// Local methods and data
// ---------------------------------------------------------------------------
static const int BUF_LEN = 64;
static XMLCh value1[BUF_LEN+1];
//
// "Scheme"
// "SchemeSpecificPart"
// "Parameters"
// "UserInfo"
// "Host"
// "Port"
// "Path"
// "Query"
// "Fragment"
//
static const XMLCh errMsg_SCHEME[] =
{
chLatin_S, chLatin_c, chLatin_h, chLatin_e,
chLatin_m, chLatin_e, chNull
};
static const XMLCh errMsg_SCHEMESPART[] =
{
chLatin_S, chLatin_c, chLatin_h, chLatin_e, chLatin_m, chLatin_e,
chLatin_S, chLatin_p, chLatin_e, chLatin_c, chLatin_i, chLatin_f,
chLatin_i, chLatin_c, chLatin_P, chLatin_a, chLatin_r, chLatin_t,
chNull
};
static const XMLCh errMsg_PARAMS[] =
{
chLatin_P, chLatin_a, chLatin_r, chLatin_a, chLatin_m,
chLatin_e, chLatin_t, chLatin_e, chLatin_r, chLatin_s, chNull
};
static const XMLCh errMsg_USERINFO[] =
{
chLatin_U, chLatin_s, chLatin_e, chLatin_r,
chLatin_i, chLatin_n, chLatin_f, chLatin_o, chNull
};
static const XMLCh errMsg_HOST[] =
{
chLatin_H, chLatin_o, chLatin_s, chLatin_t, chNull
};
static const XMLCh errMsg_PORT[] =
{
chLatin_P, chLatin_o, chLatin_r, chLatin_t, chNull
};
static const XMLCh errMsg_PATH[] =
{
chLatin_P, chLatin_a, chLatin_t, chLatin_h, chNull
};
static const XMLCh errMsg_QUERY[] =
{
chLatin_Q, chLatin_u, chLatin_e, chLatin_r, chLatin_y, chNull
};
static const XMLCh errMsg_FRAGMENT[] =
{
chLatin_F, chLatin_r, chLatin_a, chLatin_g,
chLatin_m, chLatin_e, chLatin_n, chLatin_t, chNull
};
//
// "//"
// "/"
// "./"
// "/."
// "/../"
// "/.."
//
static const XMLCh DOUBLE_SLASH[] =
{
chForwardSlash, chForwardSlash, chNull
};
static const XMLCh SINGLE_SLASH[] =
{
chForwardSlash, chNull
};
static const XMLCh DOT_SLASH[] =
{
chPeriod, chForwardSlash, chNull
};
static const XMLCh SLASH_DOT[] =
{
chForwardSlash, chPeriod, chNull
};
static const XMLCh SLASH_DOTDOT_SLASH[] =
{
chForwardSlash, chPeriod, chPeriod, chForwardSlash, chNull
};
static const XMLCh SLASH_DOTDOT[] =
{
chForwardSlash, chPeriod, chPeriod, chNull
};
//
// ":/?#"
//
// REVISIT: why?
static const XMLCh SCHEME_SEPARATORS[] =
{
chColon, chForwardSlash, chQuestion, chPound, chNull
};
//
// "?#"
//
static const XMLCh PATH_SEPARATORS[] =
{
chQuestion, chPound, chNull
};
// ---------------------------------------------------------------------------
// XMLUri: Constructors and Helper methods
// ---------------------------------------------------------------------------
// ctor# 2
XMLUri::XMLUri(const XMLCh* const uriSpec)
:fScheme(0)
,fUserInfo(0)
,fHost(0)
,fPort(-1)
,fPath(0)
,fQueryString(0)
,fFragment(0)
{
try {
initialize((XMLUri *)0, uriSpec);
}
catch (...)
{
cleanUp();
throw;
}
}
// ctor# 7 relative ctor
XMLUri::XMLUri(const XMLUri* const baseURI
, const XMLCh* const uriSpec)
:fScheme(0)
,fUserInfo(0)
,fHost(0)
,fPort(-1)
,fPath(0)
,fQueryString(0)
,fFragment(0)
{
try {
initialize(baseURI, uriSpec);
}
catch (...)
{
cleanUp();
throw;
}
}
XMLUri::~XMLUri()
{
cleanUp();
}
void XMLUri::cleanUp()
{
if (getScheme())
delete[] fScheme;
if (getUserInfo())
delete[] fUserInfo;
if (getHost())
delete[] fHost;
if (getPath())
delete[] fPath;
if (getQueryString())
delete[] fQueryString;
if (getFragment())
delete[] fFragment;
}
void XMLUri::initialize(const XMLUri& toCopy)
{
//
// assuming that all fields from the toCopy are valid,
// therefore need NOT to go through various setXXX() methods
//
fScheme = XMLString::replicate(toCopy.getScheme());
fUserInfo = XMLString::replicate(toCopy.getUserInfo());
fHost = XMLString::replicate(toCopy.getHost());
fPort = toCopy.getPort();
fPath = XMLString::replicate(toCopy.getPath());
fQueryString = XMLString::replicate(toCopy.getQueryString());
fFragment = XMLString::replicate(toCopy.getFragment());
}
void XMLUri::initialize(const XMLUri* const baseURI
, const XMLCh* const uriSpec)
{
// get a trimmed version of uriSpec
// uriSpec will NO LONGER be used in this function.
//
XMLCh* const trimedUriSpec = XMLString::replicate(uriSpec);
XMLString::trim(trimedUriSpec);
ArrayJanitor<XMLCh> janName(trimedUriSpec);
int trimedUriSpecLen = XMLString::stringLen(trimedUriSpec);
if ( !baseURI &&
(!trimedUriSpec || trimedUriSpecLen == 0))
{
ThrowXML1(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Empty
, errMsg_PARAMS);
}
// just make a copy of the base if spec is empty
if (!trimedUriSpec || trimedUriSpecLen == 0)
{
initialize(*baseURI);
return;
}
int index = 0;
// Check for scheme, which must be before `/'. Also handle names with
// DOS drive letters ('D:'), so 1-character schemes are not allowed.
int colonIdx = XMLString::indexOf(trimedUriSpec, chColon);
int slashIdx = XMLString::indexOf(trimedUriSpec, chForwardSlash);
if ((colonIdx < 2) ||
(colonIdx > slashIdx && slashIdx != -1) )
{
int fragmentIdx = XMLString::indexOf(trimedUriSpec, chPound); //'#'
// A standalone base is a valid URI according to spec
if ( !baseURI && fragmentIdx != 0 )
{
ThrowXML(NumberFormatException, XMLExcepts::XMLNUM_URI_No_Scheme);
}
}
else
{
initializeScheme(trimedUriSpec);
index = XMLString::stringLen(fScheme)+1;
}
// two slashes means generic URI syntax, so we get the authority
XMLCh* authUriSpec = new XMLCh[trimedUriSpecLen+1];
ArrayJanitor<XMLCh> authName(authUriSpec);
XMLString::subString(authUriSpec, trimedUriSpec, index, trimedUriSpecLen);
if (((index+1) < trimedUriSpecLen) &&
XMLString::startsWith(authUriSpec, DOUBLE_SLASH))
{
index += 2;
int startPos = index;
// get authority - everything up to path, query or fragment
XMLCh testChar;
while (index < trimedUriSpecLen)
{
testChar = trimedUriSpec[index];
if (testChar == chForwardSlash ||
testChar == chQuestion ||
testChar == chPound )
{
break;
}
index++;
}
// if we found authority, parse it out, otherwise we set the
// host to empty string
if (index > startPos)
{
XMLString::subString(authUriSpec, trimedUriSpec, startPos, index);
initializeAuthority(authUriSpec);
}
else
{
//fHost = 0;
setHost(0);
}
}
// we need to check if index has exceed the lenght or not
if (index >= trimedUriSpecLen)
return;
XMLCh* pathUriSpec = new XMLCh[trimedUriSpecLen+1];
ArrayJanitor<XMLCh> pathUriSpecName(pathUriSpec);
XMLString::subString(pathUriSpec, trimedUriSpec, index, trimedUriSpecLen);
initializePath(pathUriSpec);
// Resolve relative URI to base URI - see RFC 2396 Section 5.2
// In some cases, it might make more sense to throw an exception
// (when scheme is specified is the string spec and the base URI
// is also specified, for example), but we're just following the
// RFC specifications
if ( baseURI )
{
// check to see if this is the current doc - RFC 2396 5.2 #2
// note that this is slightly different from the RFC spec in that
// we don't include the check for query string being null
// - this handles cases where the urispec is just a query
// string or a fragment (e.g. "?y" or "#s") -
// see <http://www.ics.uci.edu/~fielding/url/test1.html> which
// identified this as a bug in the RFC
if ((!fPath || XMLString::stringLen(fPath) == 0) &&
fScheme == 0 &&
fHost == 0)
{
fScheme = XMLString::replicate(baseURI->getScheme());
delete [] fUserInfo;
fUserInfo = XMLString::replicate(baseURI->getUserInfo());
fHost = XMLString::replicate(baseURI->getHost());
fPort = baseURI->getPort();
delete [] fPath;
fPath = XMLString::replicate(baseURI->getPath());
if ( !fQueryString )
{
fQueryString = XMLString::replicate(baseURI->getQueryString());
}
return;
}
// check for scheme - RFC 2396 5.2 #3
// if we found a scheme, it means absolute URI, so we're done
if (fScheme == 0)
{
fScheme = XMLString::replicate(baseURI->getScheme());
}
else
{
return;
}
// check for authority - RFC 2396 5.2 #4
// if we found a host, then we've got a network path, so we're done
if (fHost == 0)
{
delete [] fUserInfo;
fUserInfo = XMLString::replicate(baseURI->getUserInfo());
fHost = XMLString::replicate(baseURI->getHost());
fPort = baseURI->getPort();
}
else
{
return;
}
// check for absolute path - RFC 2396 5.2 #5
if (XMLString::stringLen(fPath) > 0 &&
XMLString::startsWith(fPath, SINGLE_SLASH))
{
return;
}
// if we get to this point, we need to resolve relative path
// RFC 2396 5.2 #6
XMLCh* basePath = XMLString::replicate(baseURI->getPath());
ArrayJanitor<XMLCh> basePathName(basePath);
int bufLen = trimedUriSpecLen+XMLString::stringLen(fPath)+XMLString::stringLen(basePath)+1;
XMLCh* path = new XMLCh[bufLen];
ArrayJanitor<XMLCh> pathName(path);
path[0] = 0;
XMLCh* tmp1 = new XMLCh[bufLen];
ArrayJanitor<XMLCh> tmp1Name(tmp1);
XMLCh* tmp2 = new XMLCh[bufLen];
ArrayJanitor<XMLCh> tmp2Name(tmp2);
// 6a - get all but the last segment of the base URI path
if (basePath)
{
int lastSlash = XMLString::lastIndexOf(basePath, chForwardSlash);
if (lastSlash != -1)
{
XMLString::subString(path, basePath, 0, lastSlash+1);
}
}
// 6b - append the relative URI path
XMLString::catString(path, fPath);
// 6c - remove all "./" where "." is a complete path segment
index = -1;
while ((index = XMLString::patternMatch(path, DOT_SLASH)) != -1)
{
XMLString::subString(tmp1, path, 0, index);
XMLString::subString(tmp2, path, index+2, XMLString::stringLen(path));
path[0] = 0;
XMLString::catString(path, tmp1);
XMLString::catString(path, tmp2);
}
// 6d - remove "." if path ends with "." as a complete path segment
if (XMLString::endsWith(path, SLASH_DOT))
{
path[XMLString::stringLen(path) - 1] = chNull;
}
// 6e - remove all "<segment>/../" where "<segment>" is a complete
// path segment not equal to ".."
index = 1;
int segIndex = -1;
while ((index = XMLString::patternMatch(&(path[1]), SLASH_DOTDOT_SLASH)) != -1)
{
segIndex = XMLString::lastIndexOf(&(path[index-1]), chForwardSlash);
if (segIndex != -1 &&
(path[segIndex+1] != chPeriod ||
path[index] != chPeriod))
{
XMLString::subString(tmp1, path, 0, segIndex);
XMLString::subString(tmp2, path, index+3, XMLString::stringLen(path));
path[0] = 0;
XMLString::catString(path, tmp1);
XMLString::catString(path, tmp2);
index = segIndex;
}
else
{
index += 4;
}
}// while
// 6f - remove ending "<segment>/.." where "<segment>" is a
// complete path segment
if (XMLString::endsWith(path, SLASH_DOTDOT))
{
index = XMLString::stringLen(path) - 3;
segIndex = XMLString::lastIndexOf(&(path[index-1]), chForwardSlash);
if (segIndex != -1 &&
(path[segIndex+1] != chPeriod ||
path[index] != chPeriod))
{
path[segIndex+1] = chNull;
}
}
if (getPath())
delete [] fPath;
fPath = XMLString::replicate(path);
}
}
// ---------------------------------------------------------------------------
// Components initialization
// ---------------------------------------------------------------------------
//
// authority = server | reg_name
// server = [ [ userinfo "@" ] hostport ]
// hostport = host [ ":" port ]
//
// reg_name = 1*( unreserved | escaped | "$" | "," |
// ";" | ":" | "@" | "&" | "=" | "+" )
//
// userinfo = *( unreserved | escaped |
// ";" | ":" | "&" | "=" | "+" | "$" | "," )
//
void XMLUri::initializeAuthority(const XMLCh* const uriSpec)
{
int index = 0;
int start = 0;
const int end = XMLString::stringLen(uriSpec);
//
// server = [ [ userinfo "@" ] hostport ]
// userinfo is everything up @,
//
XMLCh* userinfo = new XMLCh[end+1];
ArrayJanitor<XMLCh> userName(userinfo);
index = XMLString::indexOf(&(uriSpec[start]), chAt);
if ( index != -1)
{
XMLString::subString(userinfo, &(uriSpec[start]), 0, index);
index++; // skip the @
start += index;
}
else
{
XMLString::copyString(userinfo, XMLUni::fgZeroLenString);
}
//
// hostport = host [ ":" port ]
// host is everything up to ':'
//
XMLCh* host = new XMLCh[end+1];
ArrayJanitor<XMLCh> hostName(host);
index = XMLString::indexOf(&(uriSpec[start]), chColon);
if ( index != -1)
{
XMLString::subString(host, &(uriSpec[start]), 0, index);
index++; // skip the :
start +=index;
}
else
{
XMLString::subString(host, &(uriSpec[start]), 0, end-start);
start=end;
}
// port is everything after ":"
XMLCh* portStr = new XMLCh[end+1];
ArrayJanitor<XMLCh> portName(portStr);
int port = -1;
if ((XMLString::stringLen(host) > 0) && // non empty host
(index != -1) && // ":" found
(start < end) ) // ":" is not the last
{
XMLString::subString(portStr, &(uriSpec[start]), 0, end-start);
if (XMLString::stringLen(portStr) > 0)
{
try
{
port = XMLString::parseInt(portStr);
}
catch (...)
{
throw;
}
}
} // if > 0
// The order is important, do not change
//
setHost(host);
setPort(port);
setUserInfo(userinfo);
}
// scheme = alpha *( alpha | digit | "+" | "-" | "." )
void XMLUri::initializeScheme(const XMLCh* const uriSpec)
{
const XMLCh* tmpPtr = XMLString::findAny(uriSpec, SCHEME_SEPARATORS);
if ( !tmpPtr )
{
ThrowXML(NumberFormatException, XMLExcepts::XMLNUM_URI_No_Scheme);
}
else
{
XMLCh* scheme = new XMLCh[XMLString::stringLen(uriSpec)+1];
ArrayJanitor<XMLCh> tmpName(scheme);
XMLString::subString(scheme, uriSpec, 0, (tmpPtr - uriSpec));
setScheme(scheme);
}
}
void XMLUri::initializePath(const XMLCh* const uriSpec)
{
if ( !uriSpec )
{
ThrowXML1(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Empty
, errMsg_PATH);
}
int index = 0;
int start = 0;
int end = XMLString::stringLen(uriSpec);
XMLCh testChar;
// path - everything up to query string or fragment
while (index < end)
{
testChar = uriSpec[index];
if (testChar == chQuestion || testChar == chPound)
{
break;
}
// check for valid escape sequence
if (testChar == chPercent)
{
if (index+2 >= end ||
!XMLString::isHex(uriSpec[index+1]) ||
!XMLString::isHex(uriSpec[index+2]))
{
XMLString::moveChars(value1, &(uriSpec[index]), 3);
value1[3] = chNull;
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Invalid_EscapeSequence
, errMsg_PATH
, value1);
}
}
else if (!isReservedCharacter(testChar) &&
!isUnreservedCharacter(testChar))
{
value1[0] = testChar;
value1[1] = chNull;
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Invalid_Char
, errMsg_PATH
, value1);
}
index++;
}//while (index < end)
if (getPath())
{
delete [] fPath;
}
fPath = new XMLCh[index+1];
XMLString::subString(fPath, uriSpec, start, index);
// query - starts with ? and up to fragment or end
if (testChar == chQuestion)
{
index++;
start = index;
while (index < end)
{
testChar = uriSpec[index];
if (testChar == chPound)
{
break;
}
if (testChar == chPercent)
{
if (index+2 >= end ||
!XMLString::isHex(uriSpec[index+1]) ||
!XMLString::isHex(uriSpec[index+2]))
{
XMLString::moveChars(value1, &(uriSpec[index]), 3);
value1[3] = chNull;
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Invalid_EscapeSequence
, errMsg_QUERY
, value1);
}
}
else if (!isReservedCharacter(testChar) &&
!isUnreservedCharacter(testChar))
{
value1[0] = testChar;
value1[1] = chNull;
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Invalid_Char
, errMsg_QUERY
, value1);
}
index++;
}
if (getQueryString())
{
delete [] fQueryString;
}
fQueryString = new XMLCh[index - start + 1];
XMLString::subString(fQueryString, uriSpec, start, index);
}
// fragment - starts with #
if (testChar == chPound)
{
index++;
start = index;
while (index < end)
{
testChar = uriSpec[index];
if (testChar == chPercent)
{
if (index+2 >= end ||
!XMLString::isHex(uriSpec[index+1]) ||
!XMLString::isHex(uriSpec[index+2]))
{
XMLString::moveChars(value1, &(uriSpec[index]), 3);
value1[3] = chNull;
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Invalid_EscapeSequence
, errMsg_FRAGMENT
, value1);
}
}
else if (!isReservedCharacter(testChar) &&
!isUnreservedCharacter(testChar))
{
value1[0] = testChar;
value1[1] = chNull;
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Invalid_Char
, errMsg_FRAGMENT
, value1);
}
index++;
}
if (getFragment())
delete [] fFragment;
//make sure that there is something following the '#'
if (index > start)
{
fFragment = new XMLCh[index - start + 1];
XMLString::subString(fFragment, uriSpec, start, index);
}
else
{
// RFC 2396, 4.0. URI Reference
// URI-reference = [absoulteURI | relativeURI] [# fragment]
//
// RFC 2396, 4.1. Fragment Identifier
// fragment = *uric
//
// empty fragment is valid
fFragment = 0;
}
}
}
// ---------------------------------------------------------------------------
// Setter
// ---------------------------------------------------------------------------
void XMLUri::setScheme(const XMLCh* const newScheme)
{
if ( !newScheme )
{
ThrowXML1(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Set_Null
, errMsg_SCHEME);
}
if (!isConformantSchemeName(newScheme))
{
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Not_Conformant
, errMsg_SCHEME
, newScheme);
}
if (getScheme())
{
delete [] fScheme;
}
fScheme = XMLString::replicate(newScheme);
XMLString::lowerCase(fScheme);
}
//
// server = [ [ userinfo "@" ] hostport ]
// hostport = host [":" port]
//
// setUserInfo(), setHost() and setPort() are closely related
// three methods, in a word, userinfo and port has dependency
// on host.
//
// if host is not present, userinfo must be null and port = -1
//
void XMLUri::setUserInfo(const XMLCh* const newUserInfo)
{
if ( newUserInfo &&
!getHost() )
{
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_NullHost
, errMsg_USERINFO
, newUserInfo);
}
try
{
isConformantUserInfo(newUserInfo);
}
catch (...)
{
throw;
}
if (getUserInfo())
{
delete [] fUserInfo;
}
fUserInfo = XMLString::replicate(newUserInfo);
}
void XMLUri::setHost(const XMLCh* const newHost)
{
if ( !newHost ||
XMLString::isAllWhiteSpace(newHost))
{
if (getHost())
delete [] fHost;
fHost = 0;
setUserInfo(0);
setPort(-1);
return;
}
if (!isWellFormedAddress(newHost))
{
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Not_Conformant
, errMsg_HOST
, newHost);
}
if (getHost())
{
delete [] fHost;
}
fHost = XMLString::replicate(newHost);
}
void XMLUri::setPort(int newPort)
{
if (newPort >= 0 && newPort <= 65535)
{
if (!getHost())
{
XMLString::binToText(newPort, value1, BUF_LEN, 10);
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_NullHost
, errMsg_PORT
, value1);
}
}
else if (newPort != -1)
{
XMLString::binToText(newPort, value1, BUF_LEN, 10);
ThrowXML1(NumberFormatException
, XMLExcepts::XMLNUM_URI_PortNo_Invalid
, value1);
}
fPort = newPort;
}
//
// setPath(), setQueryString() and setFragment() are closely
// related three methods as well.
//
void XMLUri::setPath(const XMLCh* const newPath)
{
if (!newPath)
{
if (getPath())
delete [] fPath;
fPath = 0;
setQueryString(0);
setFragment(0);
}
else
{
initializePath(newPath);
}
}
//
// fragment = *uric
//
void XMLUri::setFragment(const XMLCh* const newFragment)
{
if ( !newFragment )
{
if (getFragment())
delete [] fFragment;
fFragment = 0;
}
else if (!isGenericURI())
{
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_for_GenURI_Only
, errMsg_FRAGMENT
, newFragment);
}
else if ( !getPath() )
{
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_NullPath
, errMsg_FRAGMENT
, newFragment);
}
else if (!isURIString(newFragment))
{
ThrowXML1(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Invalid_Char
, errMsg_FRAGMENT);
}
else
{
if (getFragment())
{
delete [] fFragment;
}
fFragment = XMLString::replicate(newFragment);
}
}
//
// query = *uric
//
void XMLUri::setQueryString(const XMLCh* const newQueryString)
{
if ( !newQueryString )
{
if (getQueryString())
delete [] fQueryString;
fQueryString = 0;
}
else if (!isGenericURI())
{
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_for_GenURI_Only
, errMsg_QUERY
, newQueryString);
}
else if ( !getPath() )
{
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_NullPath
, errMsg_QUERY
, newQueryString);
}
else if (!isURIString(newQueryString))
{
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Invalid_Char
, errMsg_QUERY
, newQueryString);
}
else
{
if (getQueryString())
{
delete [] fQueryString;
}
fQueryString = XMLString::replicate(newQueryString);
}
}
// ---------------------------------------------------------------------------
// XMLUri: Public, static methods
// ---------------------------------------------------------------------------
//
// scheme = alpha *( alpha | digit | "+" | "-" | "." )
// alphanum = alpha | digit
//
bool XMLUri::isConformantSchemeName(const XMLCh* const scheme)
{
if ( !scheme )
return false;
const XMLCh* tmpStr = scheme;
if (!XMLString::isAlpha(*tmpStr)) // first: alpha
return false;
// second onwards: ( alpha | digit | "+" | "-" | "." )
tmpStr++;
while (*tmpStr)
{
if ( !XMLString::isAlphaNum(*tmpStr) &&
(XMLString::indexOf(SCHEME_CHARACTERS, *tmpStr) == -1))
return false;
tmpStr++;
}
return true;
}
//
// userinfo = *( unreserved | escaped |
// ";" | ":" | "&" | "=" | "+" | "$" | "," )
//
void XMLUri::isConformantUserInfo(const XMLCh* const userInfo)
{
if ( !userInfo )
return;
const XMLCh* tmpStr = userInfo;
while (*tmpStr)
{
if ( isUnreservedCharacter(*tmpStr) ||
(XMLString::indexOf(USERINFO_CHARACTERS, *tmpStr) != -1))
{
tmpStr++;
}
else if (*tmpStr == chPercent) // '%'
{
if (XMLString::isHex(*(tmpStr+1)) && // 1st hex
XMLString::isHex(*(tmpStr+2)) ) // 2nd hex
{
tmpStr+=3;
}
else
{
value1[0] = chPercent;
value1[1] = *(tmpStr+1);
value1[2] = *(tmpStr+2);
value1[3] = chNull;
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Invalid_EscapeSequence
, errMsg_USERINFO
, value1);
}
}
else
{
ThrowXML2(NumberFormatException
, XMLExcepts::XMLNUM_URI_Component_Invalid_Char
, errMsg_USERINFO
, userInfo);
}
} //while
return;
}
//
// uric = reserved | unreserved | escaped
// escaped = "%" hex hex
// hex = digit | "A" | "B" | "C" | "D" | "E" | "F" |
// "a" | "b" | "c" | "d" | "e" | "f"
//
bool XMLUri::isURIString(const XMLCh* const uricString)
{
if (!uricString || !*uricString)
return false;
const XMLCh* tmpStr = uricString;
while (*tmpStr)
{
if (isReservedCharacter(*tmpStr) ||
isUnreservedCharacter(*tmpStr) )
{
tmpStr++;
}
else if (*tmpStr == chPercent) // '%'
{
if (XMLString::isHex(*(tmpStr+1)) && // 1st hex
XMLString::isHex(*(tmpStr+2)) ) // 2nd hex
{
tmpStr+=3;
}
else
{
return false;
}
}
else
{
return false;
}
}
return true;
}
//
// host = hostname | IPv4address
//
// hostname = *( domainlabel "." ) toplabel [ "." ]
// domainlabel = alphanum | alphanum *( alphanum | "-" ) alphanum
// toplabel = alpha | alpha *( alphanum | "-" ) alphanum
//
// IPv4address = 1*digit "." 1*digit "." 1*digit "." 1*digit
//
bool XMLUri::isWellFormedAddress(const XMLCh* const addrString)
{
if (!addrString)
return false;
//
// check length
//
XMLCh* tmpAddr = XMLString::replicate(addrString);
ArrayJanitor<XMLCh> janName(tmpAddr);
XMLString::trim(tmpAddr);
if ((XMLString::stringLen(tmpAddr) == 0) ||
(XMLString::stringLen(tmpAddr) > 255) )
return false;
//
// the frist letter shall NOT be "." or "-"
//
if (*addrString == chPeriod ||
*addrString == chDash )
return false;
// rightmost domain label starting with digit indicates IP address
// since top level domain label can only start with an alpha
// see RFC 2396 Section 3.2.2
int addrStrLen = XMLString::stringLen(addrString);
int lastPeriodPos = XMLString::lastIndexOf(addrString, chPeriod);
// if the string ends with "."
// get the second last "."
if (lastPeriodPos + 1 == addrStrLen)
{
XMLCh* tmp2 = new XMLCh[addrStrLen];
XMLString::subString(tmp2, addrString, 0, lastPeriodPos);
lastPeriodPos = XMLString::lastIndexOf(tmp2, chPeriod);
delete [] tmp2;
if ( XMLString::isDigit(addrString[lastPeriodPos + 1]))
return false;
}
if (XMLString::isDigit(addrString[lastPeriodPos + 1]))
{
//
// IPv4address = 1*digit "." 1*digit "." 1*digit "." 1*digit
//
// make sure that
// 1) we see only digits and dot separators,
// 2) that any dot separator is preceded and followed by a digit
// 3) that we find 3 dots
int numDots = 0;
for (int i = 0; i < addrStrLen; i++)
{
if (addrString[i] == chPeriod)
{
if (((i > 0) &&
(!XMLString::isDigit(addrString[i-1]))) ||
((i + 1 < addrStrLen) &&
(!XMLString::isDigit(addrString[i+1]))) )
{
return false;
}
numDots++;
}
else if (!XMLString::isDigit(addrString[i]))
{
return false;
}
} //for
if (numDots != 3)
{
return false;
}
} // end of IPv4address
else
{
//
// hostname = *( domainlabel "." ) toplabel [ "." ]
// domainlabel = alphanum | alphanum *( alphanum | "-" ) alphanum
// toplabel = alpha | alpha *( alphanum | "-" ) alphanum
//
// domain labels can contain alphanumerics and '-"
// but must start and end with an alphanumeric
for (int i = 0; i < addrStrLen; i++)
{
if (addrString[i] == chPeriod)
{
if (((i > 0) &&
(!XMLString::isAlphaNum(addrString[i-1]))) ||
((i + 1 < addrStrLen) &&
(!XMLString::isAlphaNum(addrString[i+1]))) )
{
return false;
}
}
else if (!XMLString::isAlphaNum(addrString[i]) &&
addrString[i] != chDash)
{
return false;
}
} //for
}
return true;
}
bool XMLUri::isGenericURI()
{
return (getHost() != 0);
}