263 lines
7.7 KiB
JavaScript
263 lines
7.7 KiB
JavaScript
/**
|
||
* @typedef {import('micromark-util-types').Code} Code
|
||
* @typedef {import('micromark-util-types').Construct} Construct
|
||
* @typedef {import('micromark-util-types').Event} Event
|
||
* @typedef {import('micromark-util-types').Point} Point
|
||
* @typedef {import('micromark-util-types').Resolver} Resolver
|
||
* @typedef {import('micromark-util-types').State} State
|
||
* @typedef {import('micromark-util-types').Token} Token
|
||
* @typedef {import('micromark-util-types').TokenizeContext} TokenizeContext
|
||
* @typedef {import('micromark-util-types').Tokenizer} Tokenizer
|
||
*/
|
||
|
||
import {push, splice} from 'micromark-util-chunked'
|
||
import {classifyCharacter} from 'micromark-util-classify-character'
|
||
import {resolveAll} from 'micromark-util-resolve-all'
|
||
/** @type {Construct} */
|
||
export const attention = {
|
||
name: 'attention',
|
||
tokenize: tokenizeAttention,
|
||
resolveAll: resolveAllAttention
|
||
}
|
||
|
||
/**
|
||
* Take all events and resolve attention to emphasis or strong.
|
||
*
|
||
* @type {Resolver}
|
||
*/
|
||
// eslint-disable-next-line complexity
|
||
function resolveAllAttention(events, context) {
|
||
let index = -1
|
||
/** @type {number} */
|
||
let open
|
||
/** @type {Token} */
|
||
let group
|
||
/** @type {Token} */
|
||
let text
|
||
/** @type {Token} */
|
||
let openingSequence
|
||
/** @type {Token} */
|
||
let closingSequence
|
||
/** @type {number} */
|
||
let use
|
||
/** @type {Array<Event>} */
|
||
let nextEvents
|
||
/** @type {number} */
|
||
let offset
|
||
|
||
// Walk through all events.
|
||
//
|
||
// Note: performance of this is fine on an mb of normal markdown, but it’s
|
||
// a bottleneck for malicious stuff.
|
||
while (++index < events.length) {
|
||
// Find a token that can close.
|
||
if (
|
||
events[index][0] === 'enter' &&
|
||
events[index][1].type === 'attentionSequence' &&
|
||
events[index][1]._close
|
||
) {
|
||
open = index
|
||
|
||
// Now walk back to find an opener.
|
||
while (open--) {
|
||
// Find a token that can open the closer.
|
||
if (
|
||
events[open][0] === 'exit' &&
|
||
events[open][1].type === 'attentionSequence' &&
|
||
events[open][1]._open &&
|
||
// If the markers are the same:
|
||
context.sliceSerialize(events[open][1]).charCodeAt(0) ===
|
||
context.sliceSerialize(events[index][1]).charCodeAt(0)
|
||
) {
|
||
// If the opening can close or the closing can open,
|
||
// and the close size *is not* a multiple of three,
|
||
// but the sum of the opening and closing size *is* multiple of three,
|
||
// then don’t match.
|
||
if (
|
||
(events[open][1]._close || events[index][1]._open) &&
|
||
(events[index][1].end.offset - events[index][1].start.offset) % 3 &&
|
||
!(
|
||
(events[open][1].end.offset -
|
||
events[open][1].start.offset +
|
||
events[index][1].end.offset -
|
||
events[index][1].start.offset) %
|
||
3
|
||
)
|
||
) {
|
||
continue
|
||
}
|
||
|
||
// Number of markers to use from the sequence.
|
||
use =
|
||
events[open][1].end.offset - events[open][1].start.offset > 1 &&
|
||
events[index][1].end.offset - events[index][1].start.offset > 1
|
||
? 2
|
||
: 1
|
||
const start = Object.assign({}, events[open][1].end)
|
||
const end = Object.assign({}, events[index][1].start)
|
||
movePoint(start, -use)
|
||
movePoint(end, use)
|
||
openingSequence = {
|
||
type: use > 1 ? 'strongSequence' : 'emphasisSequence',
|
||
start,
|
||
end: Object.assign({}, events[open][1].end)
|
||
}
|
||
closingSequence = {
|
||
type: use > 1 ? 'strongSequence' : 'emphasisSequence',
|
||
start: Object.assign({}, events[index][1].start),
|
||
end
|
||
}
|
||
text = {
|
||
type: use > 1 ? 'strongText' : 'emphasisText',
|
||
start: Object.assign({}, events[open][1].end),
|
||
end: Object.assign({}, events[index][1].start)
|
||
}
|
||
group = {
|
||
type: use > 1 ? 'strong' : 'emphasis',
|
||
start: Object.assign({}, openingSequence.start),
|
||
end: Object.assign({}, closingSequence.end)
|
||
}
|
||
events[open][1].end = Object.assign({}, openingSequence.start)
|
||
events[index][1].start = Object.assign({}, closingSequence.end)
|
||
nextEvents = []
|
||
|
||
// If there are more markers in the opening, add them before.
|
||
if (events[open][1].end.offset - events[open][1].start.offset) {
|
||
nextEvents = push(nextEvents, [
|
||
['enter', events[open][1], context],
|
||
['exit', events[open][1], context]
|
||
])
|
||
}
|
||
|
||
// Opening.
|
||
nextEvents = push(nextEvents, [
|
||
['enter', group, context],
|
||
['enter', openingSequence, context],
|
||
['exit', openingSequence, context],
|
||
['enter', text, context]
|
||
])
|
||
|
||
// Always populated by defaults.
|
||
|
||
// Between.
|
||
nextEvents = push(
|
||
nextEvents,
|
||
resolveAll(
|
||
context.parser.constructs.insideSpan.null,
|
||
events.slice(open + 1, index),
|
||
context
|
||
)
|
||
)
|
||
|
||
// Closing.
|
||
nextEvents = push(nextEvents, [
|
||
['exit', text, context],
|
||
['enter', closingSequence, context],
|
||
['exit', closingSequence, context],
|
||
['exit', group, context]
|
||
])
|
||
|
||
// If there are more markers in the closing, add them after.
|
||
if (events[index][1].end.offset - events[index][1].start.offset) {
|
||
offset = 2
|
||
nextEvents = push(nextEvents, [
|
||
['enter', events[index][1], context],
|
||
['exit', events[index][1], context]
|
||
])
|
||
} else {
|
||
offset = 0
|
||
}
|
||
splice(events, open - 1, index - open + 3, nextEvents)
|
||
index = open + nextEvents.length - offset - 2
|
||
break
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
// Remove remaining sequences.
|
||
index = -1
|
||
while (++index < events.length) {
|
||
if (events[index][1].type === 'attentionSequence') {
|
||
events[index][1].type = 'data'
|
||
}
|
||
}
|
||
return events
|
||
}
|
||
|
||
/**
|
||
* @this {TokenizeContext}
|
||
* @type {Tokenizer}
|
||
*/
|
||
function tokenizeAttention(effects, ok) {
|
||
const attentionMarkers = this.parser.constructs.attentionMarkers.null
|
||
const previous = this.previous
|
||
const before = classifyCharacter(previous)
|
||
|
||
/** @type {NonNullable<Code>} */
|
||
let marker
|
||
return start
|
||
|
||
/**
|
||
* Before a sequence.
|
||
*
|
||
* ```markdown
|
||
* > | **
|
||
* ^
|
||
* ```
|
||
*
|
||
* @type {State}
|
||
*/
|
||
function start(code) {
|
||
marker = code
|
||
effects.enter('attentionSequence')
|
||
return inside(code)
|
||
}
|
||
|
||
/**
|
||
* In a sequence.
|
||
*
|
||
* ```markdown
|
||
* > | **
|
||
* ^^
|
||
* ```
|
||
*
|
||
* @type {State}
|
||
*/
|
||
function inside(code) {
|
||
if (code === marker) {
|
||
effects.consume(code)
|
||
return inside
|
||
}
|
||
const token = effects.exit('attentionSequence')
|
||
|
||
// To do: next major: move this to resolver, just like `markdown-rs`.
|
||
const after = classifyCharacter(code)
|
||
|
||
// Always populated by defaults.
|
||
|
||
const open =
|
||
!after || (after === 2 && before) || attentionMarkers.includes(code)
|
||
const close =
|
||
!before || (before === 2 && after) || attentionMarkers.includes(previous)
|
||
token._open = Boolean(marker === 42 ? open : open && (before || !close))
|
||
token._close = Boolean(marker === 42 ? close : close && (after || !open))
|
||
return ok(code)
|
||
}
|
||
}
|
||
|
||
/**
|
||
* Move a point a bit.
|
||
*
|
||
* Note: `move` only works inside lines! It’s not possible to move past other
|
||
* chunks (replacement characters, tabs, or line endings).
|
||
*
|
||
* @param {Point} point
|
||
* @param {number} offset
|
||
* @returns {undefined}
|
||
*/
|
||
function movePoint(point, offset) {
|
||
point.column += offset
|
||
point.offset += offset
|
||
point._bufferIndex += offset
|
||
}
|