export const xmlReplacer = /["&'<>$\x80-\uFFFF]/g; | |
const xmlCodeMap = new Map([ | |
[34, """], | |
[38, "&"], | |
[39, "'"], | |
[60, "<"], | |
[62, ">"], | |
]); | |
// For compatibility with node < 4, we wrap `codePointAt` | |
export const getCodePoint = | |
// eslint-disable-next-line @typescript-eslint/no-unnecessary-condition | |
String.prototype.codePointAt != null | |
? (str, index) => str.codePointAt(index) | |
: // http://mathiasbynens.be/notes/javascript-encoding#surrogate-formulae | |
(c, index) => (c.charCodeAt(index) & 0xfc00) === 0xd800 | |
? (c.charCodeAt(index) - 0xd800) * 0x400 + | |
c.charCodeAt(index + 1) - | |
0xdc00 + | |
0x10000 | |
: c.charCodeAt(index); | |
/** | |
* Encodes all non-ASCII characters, as well as characters not valid in XML | |
* documents using XML entities. | |
* | |
* If a character has no equivalent entity, a | |
* numeric hexadecimal reference (eg. `ü`) will be used. | |
*/ | |
export function encodeXML(str) { | |
let ret = ""; | |
let lastIdx = 0; | |
let match; | |
while ((match = xmlReplacer.exec(str)) !== null) { | |
const i = match.index; | |
const char = str.charCodeAt(i); | |
const next = xmlCodeMap.get(char); | |
if (next !== undefined) { | |
ret += str.substring(lastIdx, i) + next; | |
lastIdx = i + 1; | |
} | |
else { | |
ret += `${str.substring(lastIdx, i)}&#x${getCodePoint(str, i).toString(16)};`; | |
// Increase by 1 if we have a surrogate pair | |
lastIdx = xmlReplacer.lastIndex += Number((char & 0xfc00) === 0xd800); | |
} | |
} | |
return ret + str.substr(lastIdx); | |
} | |
/** | |
* Encodes all non-ASCII characters, as well as characters not valid in XML | |
* documents using numeric hexadecimal reference (eg. `ü`). | |
* | |
* Have a look at `escapeUTF8` if you want a more concise output at the expense | |
* of reduced transportability. | |
* | |
* @param data String to escape. | |
*/ | |
export const escape = encodeXML; | |
/** | |
* Creates a function that escapes all characters matched by the given regular | |
* expression using the given map of characters to escape to their entities. | |
* | |
* @param regex Regular expression to match characters to escape. | |
* @param map Map of characters to escape to their entities. | |
* | |
* @returns Function that escapes all characters matched by the given regular | |
* expression using the given map of characters to escape to their entities. | |
*/ | |
function getEscaper(regex, map) { | |
return function escape(data) { | |
let match; | |
let lastIdx = 0; | |
let result = ""; | |
while ((match = regex.exec(data))) { | |
if (lastIdx !== match.index) { | |
result += data.substring(lastIdx, match.index); | |
} | |
// We know that this character will be in the map. | |
result += map.get(match[0].charCodeAt(0)); | |
// Every match will be of length 1 | |
lastIdx = match.index + 1; | |
} | |
return result + data.substring(lastIdx); | |
}; | |
} | |
/** | |
* Encodes all characters not valid in XML documents using XML entities. | |
* | |
* Note that the output will be character-set dependent. | |
* | |
* @param data String to escape. | |
*/ | |
export const escapeUTF8 = getEscaper(/[&<>'"]/g, xmlCodeMap); | |
/** | |
* Encodes all characters that have to be escaped in HTML attributes, | |
* following {@link https://html.spec.whatwg.org/multipage/parsing.html#escapingString}. | |
* | |
* @param data String to escape. | |
*/ | |
export const escapeAttribute = getEscaper(/["&\u00A0]/g, new Map([ | |
[34, """], | |
[38, "&"], | |
[160, " "], | |
])); | |
/** | |
* Encodes all characters that have to be escaped in HTML text, | |
* following {@link https://html.spec.whatwg.org/multipage/parsing.html#escapingString}. | |
* | |
* @param data String to escape. | |
*/ | |
export const escapeText = getEscaper(/[&<>\u00A0]/g, new Map([ | |
[38, "&"], | |
[60, "<"], | |
[62, ">"], | |
[160, " "], | |
])); | |
//# sourceMappingURL=escape.js.map |