site/node_modules/micromark-util-decode-numeric-character-reference/dev/index.js

43 lines
1.2 KiB
JavaScript
Raw Normal View History

2024-10-14 08:09:33 +02:00
import {codes, values} from 'micromark-util-symbol'
/**
 * Turn the number (in string form as either hexa- or plain decimal) coming from
 * a numeric character reference into a character.
 *
 * Sort of like `String.fromCodePoint(Number.parseInt(value, base))`, but makes
 * non-characters and control characters safe: instead of the decoded
 * character, `values.replacementCharacter` is returned for
 *
 * - input that does not parse to a number at all,
 * - C0 controls other than HT, LF, FF, and CR,
 * - DEL and the C1 controls,
 * - surrogates,
 * - noncharacters,
 * - and anything above the last Unicode code point.
 *
 * @param {string} value
 *   Value to decode.
 * @param {number} base
 *   Numeric base.
 * @returns {string}
 *   Character.
 */
export function decodeNumericCharacterReference(value, base) {
  const code = Number.parseInt(value, base)

  if (
    // Not a number: `value` has no valid digits for `base` (or is empty).
    // Every comparison below is `false` for `NaN`, and `NaN & 65_535` is `0`,
    // so without this check `String.fromCodePoint(NaN)` would throw.
    Number.isNaN(code) ||
    // C0 except for HT, LF, FF, CR, space.
    code < codes.ht ||
    code === codes.vt ||
    (code > codes.cr && code < codes.space) ||
    // Control character (DEL) of C0, and C1 controls.
    (code > codes.tilde && code < 160) ||
    // Lone high surrogates and low surrogates.
    (code > 55_295 && code < 57_344) ||
    // Noncharacters.
    (code > 64_975 && code < 65_008) ||
    // The last two code points of every plane (`U+xFFFE` and `U+xFFFF`).
    /* eslint-disable no-bitwise */
    (code & 65_535) === 65_535 ||
    (code & 65_535) === 65_534 ||
    /* eslint-enable no-bitwise */
    // Out of range
    code > 1_114_111
  ) {
    return values.replacementCharacter
  }

  return String.fromCodePoint(code)
}