2023-09-02 01:27:33 +02:00
|
|
|
/**
 * A single user-defined macro, as produced from one `\newcommand` line.
 */
interface KaTeXMacro {
  /** How many arguments the macro takes (0 when no count is declared). */
  args: number;
  /**
   * Expansion template: string entries are copied verbatim, number entries
   * are 1-based indices of the argument to insert at that point.
   */
  rule: Array<string | number>;
}
|
2023-03-30 05:11:57 +02:00
|
|
|
|
|
|
|
/**
 * Parses one macro definition of the form
 * `\newcommand{\name}[argCount]{rule}`.
 *
 * The name may be wrapped in `{}`, `()` or `[]`; the `[argCount]` part is
 * optional. Inside the rule, an unescaped `#` followed by digits is an
 * argument placeholder.
 *
 * @param src One definition line; callers are expected to trim it first,
 *   because it must start with `\newcommand` and end with `}`.
 * @returns `[key, macro]`. The key is the bare name for macros without
 *   arguments, and the name followed by the opening bracket that wrapped the
 *   name (e.g. `"abs{"`) for macros with arguments. For any malformed input
 *   the key is `""` and the macro is empty.
 */
function parseSingleKaTeXMacro(src: string): [string, KaTeXMacro] {
  const invalid: [string, KaTeXMacro] = ["", { args: 0, rule: [] }];

  const skipSpaces = (pos: number): number => {
    while (src[pos] === " ") ++pos;
    return pos;
  };

  const prefix = "\\newcommand";
  if (!src.startsWith(prefix) || !src.endsWith("}")) return invalid;

  let currentPos = skipSpaces(prefix.length);

  // parse {\name}, (\name), or [\name]
  const nameOpenBracket = src[currentPos];
  if (
    nameOpenBracket !== "{" &&
    nameOpenBracket !== "(" &&
    nameOpenBracket !== "["
  )
    return invalid;
  const nameCloseBracket =
    nameOpenBracket === "{" ? "}" : nameOpenBracket === "(" ? ")" : "]";

  currentPos = skipSpaces(currentPos + 1);
  if (src[currentPos] !== "\\") return invalid;

  const closeNameBracketPos = src.indexOf(nameCloseBracket, currentPos);
  if (closeNameBracketPos === -1) return invalid;

  const name = src.slice(currentPos + 1, closeNameBracketPos).trim();
  if (!/^[a-zA-Z]+$/.test(name)) return invalid;

  currentPos = skipSpaces(closeNameBracketPos + 1);

  const macro: KaTeXMacro = { args: 0, rule: [] };

  // parse [number of arguments] (optional)
  if (src[currentPos] === "[") {
    const closeArgsBracketPos = src.indexOf("]", currentPos);
    if (closeArgsBracketPos === -1) return invalid;

    const argCount = Number(
      src.slice(currentPos + 1, closeArgsBracketPos).trim(),
    );
    // The count is later used as an array length and loop bound, so it must
    // be a finite non-negative integer (this also rejects NaN and Infinity).
    if (!Number.isInteger(argCount) || argCount < 0) return invalid;

    macro.args = argCount;
    currentPos = skipSpaces(closeArgsBracketPos + 1);
  }

  // parse {rule}; the rule body ends at the final "}" of src
  if (src[currentPos] !== "{") return invalid;
  currentPos = skipSpaces(currentPos + 1);
  const ruleEndPos = src.length - 1;

  while (currentPos < ruleEndPos) {
    // find the next "#" that is not preceded by an odd run of backslashes
    let numbersignPos = -1;
    let isEscaped = false;
    for (let i = currentPos; i < ruleEndPos; ++i) {
      const ch = src[i];
      if (ch === "\\") {
        isEscaped = !isEscaped;
        continue;
      }
      if (ch === "#" && !isEscaped) {
        numbersignPos = i;
        break;
      }
      // Any other character, including an escaped "#", ends the escape, so
      // that in `\##1` the second "#" is still seen as a placeholder.
      isEscaped = false;
    }

    if (numbersignPos === -1) {
      // no more placeholders: the remainder is literal text
      macro.rule.push(src.slice(currentPos, ruleEndPos));
      break;
    }

    // consume the run of digits after "#"
    let argIndexEndPos = numbersignPos + 1;
    while (argIndexEndPos < ruleEndPos && /\d/.test(src[argIndexEndPos]))
      ++argIndexEndPos;

    // an empty digit run converts to 0 and is rejected by the range check
    const argIndex = Number(src.slice(numbersignPos + 1, argIndexEndPos));
    if (Number.isNaN(argIndex) || argIndex < 1 || macro.args < argIndex)
      return invalid;

    if (currentPos !== numbersignPos)
      macro.rule.push(src.slice(currentPos, numbersignPos));
    macro.rule.push(argIndex);

    currentPos = argIndexEndPos;
  }

  return [macro.args === 0 ? name : name + nameOpenBracket, macro];
}
|
|
|
|
|
|
|
|
/**
 * Parses a block of macro definitions, one per line, into a JSON string.
 *
 * Each line is trimmed and handed to `parseSingleKaTeXMacro`; lines that come
 * back with an empty key are ignored. When two lines produce the same key,
 * the later one replaces the earlier one.
 *
 * @param src Newline-separated definition lines.
 * @returns `JSON.stringify` of an object mapping macro keys to macros.
 */
export function parseKaTeXMacros(src: string): string {
  const table: Record<string, KaTeXMacro> = {};

  src
    .split("\n")
    .map((line): [string, KaTeXMacro] => parseSingleKaTeXMacro(line.trim()))
    .filter(([key]) => key !== "")
    .forEach(([key, macro]) => {
      table[key] = macro;
    });

  return JSON.stringify(table);
}
|
|
|
|
|
|
|
|
/**
 * Runs one expansion pass over `src`.
 *
 * Text produced by a macro's rule is not rescanned within the same pass; the
 * returned flag lets the caller run further passes, since macros can expand
 * to other macros.
 *
 * A macro with arguments is looked up under its name followed by the first
 * open bracket (`(`, `{` or `[`) found after the backslash; that bracket does
 * not have to be adjacent to the name. Each argument is the content of a
 * matched bracket pair of that same kind.
 *
 * @param src Text to expand.
 * @param macros Macro table keyed as produced by the parser (bare name, or
 *   name plus open bracket for macros with arguments).
 * @param maxNumberOfExpansions Remaining budget; one unit is spent for every
 *   non-empty text range that is scanned.
 * @returns `[expanded text, whether something was expanded, remaining budget]`.
 */
function expandKaTeXMacroOnce(
  src: string,
  macros: Record<string, KaTeXMacro>,
  maxNumberOfExpansions: number,
): [string, boolean, number] {
  const openBrackets = ["(", "{", "["];
  const closeBrackets = [")", "}", "]"];

  // `macros` holds user-chosen keys, and a macro may be named like an
  // Object.prototype member (e.g. "hasOwnProperty"), so the method must not
  // be called through the table itself.
  const hasMacro = (name: string): boolean =>
    Object.prototype.hasOwnProperty.call(macros, name);

  // maps the position of each open bracket to its matching close bracket;
  // the three bracket kinds are matched independently of each other
  const bracketMapping = ((): Map<number, number> => {
    const result = new Map<number, number>();
    const pendingOpens: number[][] = openBrackets.map(() => []);

    let isEscaped = false;
    for (let i = 0; i < src.length; ++i) {
      const ch = src[i];

      if (isEscaped) {
        // this character was escaped by the preceding backslash
        isEscaped = false;
        continue;
      }
      if (ch === "\\") {
        // only \{, \} and \\ are treated as escape sequences here
        const next = src[i + 1];
        if (next === "{" || next === "}" || next === "\\") isEscaped = true;
        continue;
      }

      const openId = openBrackets.indexOf(ch);
      if (openId !== -1) {
        pendingOpens[openId].push(i);
        continue;
      }

      const closeId = closeBrackets.indexOf(ch);
      if (closeId !== -1) {
        // a close bracket with no pending open bracket is ignored
        const openPos = pendingOpens[closeId].pop();
        if (openPos !== undefined) result.set(openPos, i);
      }
    }

    return result;
  })();

  // instantiates the rule of `macroName` with already-expanded arguments
  function expandSingleKaTeXMacro(
    expandedArgs: string[],
    macroName: string,
  ): string {
    let result = "";
    for (const block of macros[macroName].rule) {
      if (typeof block === "string") result += block;
      else result += expandedArgs[block - 1];
    }
    return result;
  }

  // only expand src.slice(beginPos, endPos)
  function expandKaTeXMacroImpl(
    beginPos: number,
    endPos: number,
  ): [string, boolean] {
    if (endPos <= beginPos) return ["", false];

    // returned unchanged when nothing can or may be expanded
    const raw = src.slice(beginPos, endPos);

    if (maxNumberOfExpansions <= 0) return [raw, false];
    --maxNumberOfExpansions;

    // search for the first custom macro inside [beginPos, endPos)
    let macroName = "";
    let macroBackslashPos = 0;
    // for macros w/o args: the last character of the command name
    //            w/ args: where to look for the next argument's open bracket
    let macroArgEndPos = 0;

    let checkedPos = beginPos - 1;
    for (;;) {
      checkedPos = src.indexOf("\\", checkedPos + 1);

      // No backslash is left inside this range. A hit at or beyond endPos
      // belongs to the text after the range and must not be consumed here.
      if (checkedPos === -1 || checkedPos >= endPos) return [raw, false];

      // `\\` is an escaped backslash; its second half must not be read as
      // the start of a command name
      if (checkedPos + 1 < endPos && src[checkedPos + 1] === "\\") {
        ++checkedPos;
        continue;
      }

      // is it a custom macro without args?
      const nameBeginPos = checkedPos + 1;
      const nameLength = src.slice(nameBeginPos, endPos).search(/[^A-Za-z]/);
      const nonAlphaPos = nameLength === -1 ? endPos : nameBeginPos + nameLength;

      let macroNameCandidate = src.slice(nameBeginPos, nonAlphaPos);
      if (hasMacro(macroNameCandidate)) {
        macroBackslashPos = checkedPos;
        macroArgEndPos = nonAlphaPos - 1;
        macroName = macroNameCandidate;
        break;
      }

      // is it a custom macro with args? find the first open bracket of any
      // kind after the backslash, still inside the range
      let nextOpenBracketPos = endPos;
      for (const bracket of openBrackets) {
        const pos = src.indexOf(bracket, checkedPos + 1);
        if (pos !== -1 && pos < nextOpenBracketPos) nextOpenBracketPos = pos;
      }
      if (nextOpenBracketPos === endPos) continue; // there is no open bracket

      macroNameCandidate += src[nextOpenBracketPos];
      if (hasMacro(macroNameCandidate)) {
        macroBackslashPos = checkedPos;
        macroArgEndPos = nextOpenBracketPos; // to search the first arg from here
        macroName = macroNameCandidate;
        break;
      }
    }

    const numArgs = macros[macroName].args;
    const openBracket = macroName.slice(-1);
    const expandedArgs: string[] = [];

    for (let i = 0; i < numArgs; ++i) {
      // find the first open bracket after what we've searched
      const argOpenPos = src.indexOf(openBracket, macroArgEndPos);
      // not enough arguments are provided inside this range
      if (argOpenPos === -1 || argOpenPos >= endPos) return [raw, false];

      // the bracket is unmatched, or its match lies outside this range
      const argClosePos = bracketMapping.get(argOpenPos);
      if (argClosePos === undefined || argClosePos >= endPos)
        return [raw, false];

      macroArgEndPos = argClosePos;
      expandedArgs.push(expandKaTeXMacroImpl(argOpenPos + 1, argClosePos)[0]);
    }

    return [
      src.slice(beginPos, macroBackslashPos) +
        expandSingleKaTeXMacro(expandedArgs, macroName) +
        expandKaTeXMacroImpl(macroArgEndPos + 1, endPos)[0],
      true,
    ];
  }

  const [expandedText, expandedFlag] = expandKaTeXMacroImpl(0, src.length);
  return [expandedText, expandedFlag, maxNumberOfExpansions];
}
|
|
|
|
|
2023-03-31 04:10:03 +02:00
|
|
|
/**
 * Expands custom macros in `src`, repeating passes until a pass changes
 * nothing or the expansion budget is used up.
 *
 * @param src Text to expand.
 * @param macrosAsJSONString Macro table serialized as JSON; it is passed to
 *   `JSON.parse` as-is, so malformed JSON throws.
 * @param maxNumberOfExpansions Total budget shared by all passes.
 * @returns The text after the last pass.
 */
export function expandKaTeXMacro(
  src: string,
  macrosAsJSONString: string,
  maxNumberOfExpansions: number,
): string {
  const macros = JSON.parse(macrosAsJSONString);

  let text = src;
  let budget = maxNumberOfExpansions;

  for (let changed = true; changed && budget > 0; ) {
    [text, changed, budget] = expandKaTeXMacroOnce(text, macros, budget);
  }

  return text;
}
|