site/node_modules/mdast-util-math/lib/index.js
2024-10-14 08:09:33 +02:00

317 lines
8.4 KiB
JavaScript
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

/**
* @typedef {import('hast').Element} HastElement
* @typedef {import('hast').ElementContent} HastElementContent
* @typedef {import('mdast-util-from-markdown').CompileContext} CompileContext
* @typedef {import('mdast-util-from-markdown').Extension} FromMarkdownExtension
* @typedef {import('mdast-util-from-markdown').Handle} FromMarkdownHandle
* @typedef {import('mdast-util-to-markdown').Handle} ToMarkdownHandle
* @typedef {import('mdast-util-to-markdown').Options} ToMarkdownExtension
* @typedef {import('../index.js').InlineMath} InlineMath
* @typedef {import('../index.js').Math} Math
*
* @typedef ToOptions
* Configuration.
* @property {boolean | null | undefined} [singleDollarTextMath=true]
* Whether to support math (text) with a single dollar (default: `true`).
*
* Single dollars work in Pandoc and many other places, but often interfere
* with “normal” dollars in text.
* If you turn this off, you can still use two or more dollars for text math.
*/
import {ok as assert} from 'devlop'
import {longestStreak} from 'longest-streak'
/**
* Create an extension for `mdast-util-from-markdown`.
*
* @returns {FromMarkdownExtension}
* Extension for `mdast-util-from-markdown`.
*/
export function mathFromMarkdown() {
return {
enter: {
mathFlow: enterMathFlow,
mathFlowFenceMeta: enterMathFlowMeta,
mathText: enterMathText
},
exit: {
mathFlow: exitMathFlow,
mathFlowFence: exitMathFlowFence,
mathFlowFenceMeta: exitMathFlowMeta,
mathFlowValue: exitMathData,
mathText: exitMathText,
mathTextData: exitMathData
}
}
/**
* @this {CompileContext}
* @type {FromMarkdownHandle}
*/
function enterMathFlow(token) {
/** @type {HastElement} */
const code = {
type: 'element',
tagName: 'code',
properties: {className: ['language-math', 'math-display']},
children: []
}
this.enter(
{
type: 'math',
meta: null,
value: '',
data: {hName: 'pre', hChildren: [code]}
},
token
)
}
/**
* @this {CompileContext}
* @type {FromMarkdownHandle}
*/
function enterMathFlowMeta() {
this.buffer()
}
/**
* @this {CompileContext}
* @type {FromMarkdownHandle}
*/
function exitMathFlowMeta() {
const data = this.resume()
const node = this.stack[this.stack.length - 1]
assert(node.type === 'math')
node.meta = data
}
/**
* @this {CompileContext}
* @type {FromMarkdownHandle}
*/
function exitMathFlowFence() {
// Exit if this is the closing fence.
if (this.data.mathFlowInside) return
this.buffer()
this.data.mathFlowInside = true
}
/**
* @this {CompileContext}
* @type {FromMarkdownHandle}
*/
function exitMathFlow(token) {
const data = this.resume().replace(/^(\r?\n|\r)|(\r?\n|\r)$/g, '')
const node = this.stack[this.stack.length - 1]
assert(node.type === 'math')
this.exit(token)
node.value = data
// @ts-expect-error: we defined it in `enterMathFlow`.
const code = /** @type {HastElement} */ (node.data.hChildren[0])
assert(code.type === 'element')
assert(code.tagName === 'code')
code.children.push({type: 'text', value: data})
this.data.mathFlowInside = undefined
}
/**
* @this {CompileContext}
* @type {FromMarkdownHandle}
*/
function enterMathText(token) {
this.enter(
{
type: 'inlineMath',
value: '',
data: {
hName: 'code',
hProperties: {className: ['language-math', 'math-inline']},
hChildren: []
}
},
token
)
this.buffer()
}
/**
* @this {CompileContext}
* @type {FromMarkdownHandle}
*/
function exitMathText(token) {
const data = this.resume()
const node = this.stack[this.stack.length - 1]
assert(node.type === 'inlineMath')
this.exit(token)
node.value = data
const children = /** @type {Array<HastElementContent>} */ (
// @ts-expect-error: we defined it in `enterMathFlow`.
node.data.hChildren
)
children.push({type: 'text', value: data})
}
/**
* @this {CompileContext}
* @type {FromMarkdownHandle}
*/
function exitMathData(token) {
this.config.enter.data.call(this, token)
this.config.exit.data.call(this, token)
}
}
/**
* Create an extension for `mdast-util-to-markdown`.
*
* @param {ToOptions | null | undefined} [options]
* Configuration (optional).
* @returns {ToMarkdownExtension}
* Extension for `mdast-util-to-markdown`.
*/
export function mathToMarkdown(options) {
let single = (options || {}).singleDollarTextMath
if (single === null || single === undefined) {
single = true
}
inlineMath.peek = inlineMathPeek
return {
unsafe: [
{character: '\r', inConstruct: 'mathFlowMeta'},
{character: '\n', inConstruct: 'mathFlowMeta'},
{
character: '$',
after: single ? undefined : '\\$',
inConstruct: 'phrasing'
},
{character: '$', inConstruct: 'mathFlowMeta'},
{atBreak: true, character: '$', after: '\\$'}
],
handlers: {math, inlineMath}
}
/**
* @type {ToMarkdownHandle}
* @param {Math} node
*/
// Note: fixing this code? Please also fix the similar code for code:
// <https://github.com/syntax-tree/mdast-util-to-markdown/blob/main/lib/handle/code.js>
function math(node, _, state, info) {
const raw = node.value || ''
const tracker = state.createTracker(info)
const sequence = '$'.repeat(Math.max(longestStreak(raw, '$') + 1, 2))
const exit = state.enter('mathFlow')
let value = tracker.move(sequence)
if (node.meta) {
const subexit = state.enter('mathFlowMeta')
value += tracker.move(
state.safe(node.meta, {
after: '\n',
before: value,
encode: ['$'],
...tracker.current()
})
)
subexit()
}
value += tracker.move('\n')
if (raw) {
value += tracker.move(raw + '\n')
}
value += tracker.move(sequence)
exit()
return value
}
/**
* @type {ToMarkdownHandle}
* @param {InlineMath} node
*/
// Note: fixing this code? Please also fix the similar code for inline code:
// <https://github.com/syntax-tree/mdast-util-to-markdown/blob/main/lib/handle/inline-code.js>
function inlineMath(node, _, state) {
let value = node.value || ''
let size = 1
if (!single) size++
// If there is a single dollar sign on its own in the math, use a fence of
// two.
// If there are two in a row, use one.
while (
new RegExp('(^|[^$])' + '\\$'.repeat(size) + '([^$]|$)').test(value)
) {
size++
}
const sequence = '$'.repeat(size)
// If this is not just spaces or eols (tabs dont count), and either the
// first and last character are a space or eol, or the first or last
// character are dollar signs, then pad with spaces.
if (
// Contains non-space.
/[^ \r\n]/.test(value) &&
// Starts with space and ends with space.
((/^[ \r\n]/.test(value) && /[ \r\n]$/.test(value)) ||
// Starts or ends with dollar.
/^\$|\$$/.test(value))
) {
value = ' ' + value + ' '
}
let index = -1
// We have a potential problem: certain characters after eols could result in
// blocks being seen.
// For example, if someone injected the string `'\n# b'`, then that would
// result in an ATX heading.
// We cant escape characters in `inlineMath`, but because eols are
// transformed to spaces when going from markdown to HTML anyway, we can swap
// them out.
while (++index < state.unsafe.length) {
const pattern = state.unsafe[index]
// Only look for `atBreak`s.
// Btw: note that `atBreak` patterns will always start the regex at LF or
// CR.
if (!pattern.atBreak) continue
const expression = state.compilePattern(pattern)
/** @type {RegExpExecArray | null} */
let match
while ((match = expression.exec(value))) {
let position = match.index
// Support CRLF (patterns only look for one of the characters).
if (
value.codePointAt(position) === 10 /* `\n` */ &&
value.codePointAt(position - 1) === 13 /* `\r` */
) {
position--
}
value = value.slice(0, position) + ' ' + value.slice(match.index + 1)
}
}
return sequence + value + sequence
}
/**
* @returns {string}
*/
function inlineMathPeek() {
return '$'
}
}