refac: latex

This commit is contained in:
Timothy J. Baek 2024-08-14 16:07:39 +02:00
parent 0ec1f9e331
commit 6aefc79807
3 changed files with 120 additions and 70 deletions

View File

@ -37,10 +37,7 @@
</del> </del>
{:else if token.type === 'inlineKatex'} {:else if token.type === 'inlineKatex'}
{#if token.text} {#if token.text}
<KatexRenderer <KatexRenderer content={revertSanitizedResponseContent(token.text)} displayMode={false} />
content={revertSanitizedResponseContent(token.text)}
displayMode={token?.displayMode ?? false}
/>
{/if} {/if}
{:else if token.type === 'text'} {:else if token.type === 'text'}
{token.raw} {token.raw}

View File

@ -116,6 +116,13 @@
displayMode={token?.displayMode ?? false} displayMode={token?.displayMode ?? false}
/> />
{/if} {/if}
{:else if token.type === 'blockKatex'}
{#if token.text}
<KatexRenderer
content={revertSanitizedResponseContent(token.text)}
displayMode={token?.displayMode ?? false}
/>
{/if}
{:else if token.type === 'space'} {:else if token.type === 'space'}
{''} {''}
{:else} {:else}

View File

@ -1,29 +1,72 @@
import katex from 'katex'; import katex from 'katex';
const inlineRule = const DELIMITER_LIST = [
/^(\${1,2})(?!\$)((?:\\.|[^\\\n])*?(?:\\.|[^\\\n\$]))\1(?=[\s?!\.,:?!。,:]|$)/; { left: '$$', right: '$$', display: false },
const inlineRuleNonStandard = /^(\${1,2})(?!\$)((?:\\.|[^\\\n])*?(?:\\.|[^\\\n\$]))\1/; // Non-standard, even if there are no spaces before and after $ or $$, try to parse { left: '$', right: '$', display: false },
{ left: '\\pu{', right: '}', display: false },
{ left: '\\ce{', right: '}', display: false },
{ left: '\\(', right: '\\)', display: false },
{ left: '( ', right: ' )', display: false },
{ left: '\\[', right: '\\]', display: true },
{ left: '[', right: ']', display: true }
]
const blockRule = /^(\${1,2})\n((?:\\[^]|[^\\])+?)\n\1(?:\n|$)/; // const DELIMITER_LIST = [
// { left: '$$', right: '$$', display: false },
// { left: '$', right: '$', display: false },
// ];
export default function (options = {}) { // const inlineRule = /^(\${1,2})(?!\$)((?:\\.|[^\\\n])*?(?:\\.|[^\\\n\$]))\1(?=[\s?!\.,:?!。,:]|$)/;
// const blockRule = /^(\${1,2})\n((?:\\[^]|[^\\])+?)\n\1(?:\n|$)/;
// Regex source fragments collected by generateRegexRules(): every call pushes
// one inline and one block alternative per delimiter pair onto these arrays.
let inlinePatterns = [];
let blockPatterns = [];
/**
 * Escape a literal string so it can be embedded in a RegExp source.
 *
 * Regex syntax characters are backslash-escaped. A hyphen is emitted as `\x2d`
 * rather than `\-`: the rules built from this output use the `u` flag, where
 * `\-` outside a character class is a syntax error, while `\x2d` is valid both
 * inside and outside a character class.
 *
 * @param {string} string - Literal text (e.g. a math delimiter such as `$$`).
 * @returns {string} Regex source that matches `string` literally.
 */
function escapeRegex(string) {
	return string.replace(/[\/\\^$*+?.()|[\]{}]/g, '\\$&').replace(/-/g, '\\x2d');
}
/**
 * Build the inline and block tokenizer regexes from a list of math delimiters.
 *
 * For each delimiter pair one inline alternative and one block alternative are
 * appended to the module-level `inlinePatterns` / `blockPatterns` arrays, so
 * calling this function more than once accumulates alternatives.
 *
 * In both rules capture group 1 is the whole delimited span and every
 * delimiter pair contributes one further capture group holding its content.
 *
 * @param {Array<{left: string, right: string}>} delimiters - Delimiter pairs;
 *   only `left` and `right` are read here.
 * @returns {{inlineRule: RegExp, blockRule: RegExp}} Unicode-mode regexes
 *   anchored at the start of the input. `inlineRule` additionally requires the
 *   match to be followed by whitespace, one of the listed punctuation marks,
 *   or end of input; `blockRule` requires a newline or end of input.
 */
function generateRegexRules(delimiters) {
	for (const { left, right } of delimiters) {
		// Delimiters are literal text; make them safe to splice into regex source.
		const escapedLeft = escapeRegex(left);
		const escapedRight = escapeRegex(right);

		// Inline form, e.g. $text$ : content is escaped pairs or any character
		// except backslash/newline. The last content character must not begin the
		// closing delimiter. This is a lookahead on the whole delimiter rather than
		// a negated character class, because a class would forbid every single
		// character of a multi-character delimiter (e.g. a trailing `)` inside
		// `\( ... \)`), rejecting valid input such as `\(f(x)\)`.
		inlinePatterns.push(
			`${escapedLeft}((?:\\\\.|[^\\\\\\n])*?(?:\\\\.|(?!${escapedRight})[^\\\\\\n]))${escapedRight}`
		);

		// Block form: opening and closing delimiters each on their own line, e.g.
		// $$\ncontent here\n$$
		blockPatterns.push(`${escapedLeft}\n((?:\\\\[^]|[^\\\\])+?)\n${escapedRight}`);
	}

	const inlineRule = new RegExp(`^(${inlinePatterns.join('|')})(?=[\\s?!.,:?!。,:]|$)`, 'u');
	const blockRule = new RegExp(`^(${blockPatterns.join('|')})(?:\n|$)`, 'u');

	return { inlineRule, blockRule };
}
// Compile the tokenizer rules once, at module load, from DELIMITER_LIST.
const { inlineRule, blockRule } = generateRegexRules(DELIMITER_LIST);
export default function(options = {}) {
return { return {
extensions: [ extensions: [
inlineKatex(options, createRenderer(options, false)), inlineKatex(options, createRenderer(options, false)),
blockKatex(options, createRenderer(options, true)) blockKatex(options, createRenderer(options, true)),
] ],
}; };
} }
function createRenderer(options, newlineAfter) { function createRenderer(options, newlineAfter) {
return (token) => return (token) => katex.renderToString(token.text, { ...options, displayMode: token.displayMode }) + (newlineAfter ? '\n' : '');
katex.renderToString(token.text, { ...options, displayMode: token.displayMode }) +
(newlineAfter ? '\n' : '');
} }
function inlineKatex(options, renderer) { function inlineKatex(options, renderer) {
const nonStandard = options && options.nonStandard; const ruleReg = inlineRule;
const ruleReg = nonStandard ? inlineRuleNonStandard : inlineRule;
return { return {
name: 'inlineKatex', name: 'inlineKatex',
level: 'inline', level: 'inline',
@ -36,7 +79,7 @@ function inlineKatex(options, renderer) {
if (index === -1) { if (index === -1) {
return; return;
} }
const f = nonStandard ? index > -1 : index === 0 || indexSrc.charAt(index - 1) === ' '; const f = index === 0 || indexSrc.charAt(index - 1) === ' ';
if (f) { if (f) {
const possibleKatex = indexSrc.substring(index); const possibleKatex = indexSrc.substring(index);
@ -50,16 +93,19 @@ function inlineKatex(options, renderer) {
}, },
tokenizer(src, tokens) { tokenizer(src, tokens) {
const match = src.match(ruleReg); const match = src.match(ruleReg);
if (match) { if (match) {
console.log(match)
const text = match.slice(2).filter((item) => item).find((item) => item.trim());
return { return {
type: 'inlineKatex', type: 'inlineKatex',
raw: match[0], raw: match[0],
text: match[2].trim(), text: text,
displayMode: match[1].length === 2
}; };
} }
}, },
renderer renderer,
}; };
} }
@ -73,11 +119,11 @@ function blockKatex(options, renderer) {
return { return {
type: 'blockKatex', type: 'blockKatex',
raw: match[0], raw: match[0],
text: match[2].trim(), text: match[0],
displayMode: match[1].length === 2
}; };
} }
}, },
renderer renderer,
}; };
} }