116 lines
No EOL
3.9 KiB
JavaScript
116 lines
No EOL
3.9 KiB
JavaScript
export const xmlReplacer = /["&'<>$\x80-\uFFFF]/g;
|
|
const xmlCodeMap = new Map([
|
|
[34, """],
|
|
[38, "&"],
|
|
[39, "'"],
|
|
[60, "<"],
|
|
[62, ">"],
|
|
]);
|
|
// For compatibility with node < 4, we wrap `codePointAt`
|
|
export const getCodePoint =
|
|
// eslint-disable-next-line @typescript-eslint/no-unnecessary-condition
|
|
String.prototype.codePointAt != null
|
|
? (str, index) => str.codePointAt(index)
|
|
: // http://mathiasbynens.be/notes/javascript-encoding#surrogate-formulae
|
|
(c, index) => (c.charCodeAt(index) & 0xfc00) === 0xd800
|
|
? (c.charCodeAt(index) - 0xd800) * 0x400 +
|
|
c.charCodeAt(index + 1) -
|
|
0xdc00 +
|
|
0x10000
|
|
: c.charCodeAt(index);
|
|
/**
|
|
* Encodes all non-ASCII characters, as well as characters not valid in XML
|
|
* documents using XML entities.
|
|
*
|
|
* If a character has no equivalent entity, a
|
|
* numeric hexadecimal reference (eg. `ü`) will be used.
|
|
*/
|
|
export function encodeXML(str) {
|
|
let ret = "";
|
|
let lastIdx = 0;
|
|
let match;
|
|
while ((match = xmlReplacer.exec(str)) !== null) {
|
|
const i = match.index;
|
|
const char = str.charCodeAt(i);
|
|
const next = xmlCodeMap.get(char);
|
|
if (next !== undefined) {
|
|
ret += str.substring(lastIdx, i) + next;
|
|
lastIdx = i + 1;
|
|
}
|
|
else {
|
|
ret += `${str.substring(lastIdx, i)}&#x${getCodePoint(str, i).toString(16)};`;
|
|
// Increase by 1 if we have a surrogate pair
|
|
lastIdx = xmlReplacer.lastIndex += Number((char & 0xfc00) === 0xd800);
|
|
}
|
|
}
|
|
return ret + str.substr(lastIdx);
|
|
}
|
|
/**
|
|
* Encodes all non-ASCII characters, as well as characters not valid in XML
|
|
* documents using numeric hexadecimal reference (eg. `ü`).
|
|
*
|
|
* Have a look at `escapeUTF8` if you want a more concise output at the expense
|
|
* of reduced transportability.
|
|
*
|
|
* @param data String to escape.
|
|
*/
|
|
export const escape = encodeXML;
|
|
/**
|
|
* Creates a function that escapes all characters matched by the given regular
|
|
* expression using the given map of characters to escape to their entities.
|
|
*
|
|
* @param regex Regular expression to match characters to escape.
|
|
* @param map Map of characters to escape to their entities.
|
|
*
|
|
* @returns Function that escapes all characters matched by the given regular
|
|
* expression using the given map of characters to escape to their entities.
|
|
*/
|
|
function getEscaper(regex, map) {
|
|
return function escape(data) {
|
|
let match;
|
|
let lastIdx = 0;
|
|
let result = "";
|
|
while ((match = regex.exec(data))) {
|
|
if (lastIdx !== match.index) {
|
|
result += data.substring(lastIdx, match.index);
|
|
}
|
|
// We know that this character will be in the map.
|
|
result += map.get(match[0].charCodeAt(0));
|
|
// Every match will be of length 1
|
|
lastIdx = match.index + 1;
|
|
}
|
|
return result + data.substring(lastIdx);
|
|
};
|
|
}
|
|
/**
|
|
* Encodes all characters not valid in XML documents using XML entities.
|
|
*
|
|
* Note that the output will be character-set dependent.
|
|
*
|
|
* @param data String to escape.
|
|
*/
|
|
export const escapeUTF8 = getEscaper(/[&<>'"]/g, xmlCodeMap);
|
|
/**
|
|
* Encodes all characters that have to be escaped in HTML attributes,
|
|
* following {@link https://html.spec.whatwg.org/multipage/parsing.html#escapingString}.
|
|
*
|
|
* @param data String to escape.
|
|
*/
|
|
export const escapeAttribute = getEscaper(/["&\u00A0]/g, new Map([
|
|
[34, """],
|
|
[38, "&"],
|
|
[160, " "],
|
|
]));
|
|
/**
|
|
* Encodes all characters that have to be escaped in HTML text,
|
|
* following {@link https://html.spec.whatwg.org/multipage/parsing.html#escapingString}.
|
|
*
|
|
* @param data String to escape.
|
|
*/
|
|
export const escapeText = getEscaper(/[&<>\u00A0]/g, new Map([
|
|
[38, "&"],
|
|
[60, "<"],
|
|
[62, ">"],
|
|
[160, " "],
|
|
]));
|
|
//# sourceMappingURL=escape.js.map
|