blob: 6a68011dec97aa2f17b14d5edda977acc3dfdafd [file] [log] [blame]
var HTML_ALPHA = ['apos', 'nbsp', 'iexcl', 'cent', 'pound', 'curren', 'yen', 'brvbar', 'sect', 'uml', 'copy', 'ordf', 'laquo', 'not', 'shy', 'reg', 'macr', 'deg', 'plusmn', 'sup2', 'sup3', 'acute', 'micro', 'para', 'middot', 'cedil', 'sup1', 'ordm', 'raquo', 'frac14', 'frac12', 'frac34', 'iquest', 'Agrave', 'Aacute', 'Acirc', 'Atilde', 'Auml', 'Aring', 'Aelig', 'Ccedil', 'Egrave', 'Eacute', 'Ecirc', 'Euml', 'Igrave', 'Iacute', 'Icirc', 'Iuml', 'ETH', 'Ntilde', 'Ograve', 'Oacute', 'Ocirc', 'Otilde', 'Ouml', 'times', 'Oslash', 'Ugrave', 'Uacute', 'Ucirc', 'Uuml', 'Yacute', 'THORN', 'szlig', 'agrave', 'aacute', 'acirc', 'atilde', 'auml', 'aring', 'aelig', 'ccedil', 'egrave', 'eacute', 'ecirc', 'euml', 'igrave', 'iacute', 'icirc', 'iuml', 'eth', 'ntilde', 'ograve', 'oacute', 'ocirc', 'otilde', 'ouml', 'divide', 'oslash', 'ugrave', 'uacute', 'ucirc', 'uuml', 'yacute', 'thorn', 'yuml', 'quot', 'amp', 'lt', 'gt', 'OElig', 'oelig', 'Scaron', 'scaron', 'Yuml', 'circ', 'tilde', 'ensp', 'emsp', 'thinsp', 'zwnj', 'zwj', 'lrm', 'rlm', 'ndash', 'mdash', 'lsquo', 'rsquo', 'sbquo', 'ldquo', 'rdquo', 'bdquo', 'dagger', 'Dagger', 'permil', 'lsaquo', 'rsaquo', 'euro', 'fnof', 'Alpha', 'Beta', 'Gamma', 'Delta', 'Epsilon', 'Zeta', 'Eta', 'Theta', 'Iota', 'Kappa', 'Lambda', 'Mu', 'Nu', 'Xi', 'Omicron', 'Pi', 'Rho', 'Sigma', 'Tau', 'Upsilon', 'Phi', 'Chi', 'Psi', 'Omega', 'alpha', 'beta', 'gamma', 'delta', 'epsilon', 'zeta', 'eta', 'theta', 'iota', 'kappa', 'lambda', 'mu', 'nu', 'xi', 'omicron', 'pi', 'rho', 'sigmaf', 'sigma', 'tau', 'upsilon', 'phi', 'chi', 'psi', 'omega', 'thetasym', 'upsih', 'piv', 'bull', 'hellip', 'prime', 'Prime', 'oline', 'frasl', 'weierp', 'image', 'real', 'trade', 'alefsym', 'larr', 'uarr', 'rarr', 'darr', 'harr', 'crarr', 'lArr', 'uArr', 'rArr', 'dArr', 'hArr', 'forall', 'part', 'exist', 'empty', 'nabla', 'isin', 'notin', 'ni', 'prod', 'sum', 'minus', 'lowast', 'radic', 'prop', 'infin', 'ang', 'and', 'or', 'cap', 'cup', 'int', 'there4', 'sim', 'cong', 'asymp', 'ne', 'equiv', 'le', 'ge', 'sub', 'sup', 'nsub', 'sube', 'supe', 'oplus', 'otimes', 'perp', 'sdot', 'lceil', 'rceil', 'lfloor', 'rfloor', 'lang', 'rang', 'loz', 'spades', 'clubs', 'hearts', 'diams'];
var HTML_CODES = [39, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 34, 38, 60, 62, 338, 339, 352, 353, 376, 710, 732, 8194, 8195, 8201, 8204, 8205, 8206, 8207, 8211, 8212, 8216, 8217, 8218, 8220, 8221, 8222, 8224, 8225, 8240, 8249, 8250, 8364, 402, 913, 914, 915, 916, 917, 918, 919, 920, 921, 922, 923, 924, 925, 926, 927, 928, 929, 931, 932, 933, 934, 935, 936, 937, 945, 946, 947, 948, 949, 950, 951, 952, 953, 954, 955, 956, 957, 958, 959, 960, 961, 962, 963, 964, 965, 966, 967, 968, 969, 977, 978, 982, 8226, 8230, 8242, 8243, 8254, 8260, 8472, 8465, 8476, 8482, 8501, 8592, 8593, 8594, 8595, 8596, 8629, 8656, 8657, 8658, 8659, 8660, 8704, 8706, 8707, 8709, 8711, 8712, 8713, 8715, 8719, 8721, 8722, 8727, 8730, 8733, 8734, 8736, 8743, 8744, 8745, 8746, 8747, 8756, 8764, 8773, 8776, 8800, 8801, 8804, 8805, 8834, 8835, 8836, 8838, 8839, 8853, 8855, 8869, 8901, 8968, 8969, 8970, 8971, 9001, 9002, 9674, 9824, 9827, 9829, 9830];
var alphaIndex = {};
var numIndex = {};
var i = 0;
var length = HTML_ALPHA.length;
while (i < length) {
var a = HTML_ALPHA[i];
var c = HTML_CODES[i];
alphaIndex[a] = String.fromCharCode(c);
numIndex[c] = a;
i++;
}
/**
* @constructor
*/
function Html4Entities() {}
/**
* @param {String} str
* @returns {String}
*/
Html4Entities.prototype.decode = function(str) {
if (!str || !str.length) {
return '';
}
return str.replace(/&(#?[\w\d]+);?/g, function(s, entity) {
var chr;
if (entity.charAt(0) === "#") {
var code = entity.charAt(1).toLowerCase() === 'x' ?
parseInt(entity.substr(2), 16) :
parseInt(entity.substr(1));
if (!(isNaN(code) || code < -32768 || code > 65535)) {
chr = String.fromCharCode(code);
}
} else {
chr = alphaIndex[entity];
}
return chr || s;
});
};
/**
* @param {String} str
* @returns {String}
*/
Html4Entities.decode = function(str) {
return new Html4Entities().decode(str);
};
/**
* @param {String} str
* @returns {String}
*/
Html4Entities.prototype.encode = function(str) {
if (!str || !str.length) {
return '';
}
var strLength = str.length;
var result = '';
var i = 0;
while (i < strLength) {
var alpha = numIndex[str.charCodeAt(i)];
result += alpha ? "&" + alpha + ";" : str.charAt(i);
i++;
}
return result;
};
/**
* @param {String} str
* @returns {String}
*/
Html4Entities.encode = function(str) {
return new Html4Entities().encode(str);
};
/**
* @param {String} str
* @returns {String}
*/
Html4Entities.prototype.encodeNonUTF = function(str) {
if (!str || !str.length) {
return '';
}
var strLength = str.length;
var result = '';
var i = 0;
while (i < strLength) {
var cc = str.charCodeAt(i);
var alpha = numIndex[cc];
if (alpha) {
result += "&" + alpha + ";";
} else if (cc < 32 || cc > 126) {
result += "&#" + cc + ";";
} else {
result += str.charAt(i);
}
i++;
}
return result;
};
/**
* @param {String} str
* @returns {String}
*/
Html4Entities.encodeNonUTF = function(str) {
return new Html4Entities().encodeNonUTF(str);
};
/**
* @param {String} str
* @returns {String}
*/
Html4Entities.prototype.encodeNonASCII = function(str) {
if (!str || !str.length) {
return '';
}
var strLength = str.length;
var result = '';
var i = 0;
while (i < strLength) {
var c = str.charCodeAt(i);
if (c <= 255) {
result += str[i++];
continue;
}
result += '&#' + c + ';';
i++;
}
return result;
};
/**
* @param {String} str
* @returns {String}
*/
Html4Entities.encodeNonASCII = function(str) {
return new Html4Entities().encodeNonASCII(str);
};
module.exports = Html4Entities;