mirror of
https://github.com/Mintplex-Labs/anything-llm.git
synced 2025-03-13 05:32:24 +00:00
breakout latex plugin for delims (#3040)
* Breakout LaTeX plugin for modification * backport regular markdown link
This commit is contained in:
parent
55ffc08867
commit
c56d3b1558
4 changed files with 280 additions and 10 deletions
frontend
|
@ -24,7 +24,7 @@
|
||||||
"js-levenshtein": "^1.1.6",
|
"js-levenshtein": "^1.1.6",
|
||||||
"lodash.debounce": "^4.0.8",
|
"lodash.debounce": "^4.0.8",
|
||||||
"markdown-it": "^13.0.1",
|
"markdown-it": "^13.0.1",
|
||||||
"markdown-it-katex": "^2.0.3",
|
"katex": "^0.6.0",
|
||||||
"moment": "^2.30.1",
|
"moment": "^2.30.1",
|
||||||
"onnxruntime-web": "^1.18.0",
|
"onnxruntime-web": "^1.18.0",
|
||||||
"pluralize": "^8.0.0",
|
"pluralize": "^8.0.0",
|
||||||
|
|
|
@ -1,6 +1,6 @@
|
||||||
import { encode as HTMLEncode } from "he";
|
import { encode as HTMLEncode } from "he";
|
||||||
import markdownIt from "markdown-it";
|
import markdownIt from "markdown-it";
|
||||||
import markdownItKatex from "markdown-it-katex";
|
import markdownItKatexPlugin from "./plugins/markdown-katex";
|
||||||
import hljs from "highlight.js";
|
import hljs from "highlight.js";
|
||||||
import "./themes/github-dark.css";
|
import "./themes/github-dark.css";
|
||||||
import "./themes/github.css";
|
import "./themes/github.css";
|
||||||
|
@ -66,7 +66,7 @@ markdown.renderer.rules.image = function (tokens, idx) {
|
||||||
return `<div class="w-full max-w-[800px]"><img src="${src}" alt="${alt}" class="w-full h-auto" /></div>`;
|
return `<div class="w-full max-w-[800px]"><img src="${src}" alt="${alt}" class="w-full h-auto" /></div>`;
|
||||||
};
|
};
|
||||||
|
|
||||||
markdown.use(markdownItKatex);
|
markdown.use(markdownItKatexPlugin);
|
||||||
|
|
||||||
export default function renderMarkdown(text = "") {
|
export default function renderMarkdown(text = "") {
|
||||||
return markdown.render(text);
|
return markdown.render(text);
|
||||||
|
|
277
frontend/src/utils/chat/plugins/markdown-katex.js
Normal file
277
frontend/src/utils/chat/plugins/markdown-katex.js
Normal file
|
@ -0,0 +1,277 @@
|
||||||
|
import katex from "katex";
|
||||||
|
|
||||||
|
// Test if potential opening or closing delimieter
|
||||||
|
// Assumes that there is a "$" at state.src[pos]
|
||||||
|
function isValidDelim(state, pos) {
|
||||||
|
var prevChar,
|
||||||
|
nextChar,
|
||||||
|
max = state.posMax,
|
||||||
|
can_open = true,
|
||||||
|
can_close = true;
|
||||||
|
|
||||||
|
prevChar = pos > 0 ? state.src.charCodeAt(pos - 1) : -1;
|
||||||
|
nextChar = pos + 1 <= max ? state.src.charCodeAt(pos + 1) : -1;
|
||||||
|
|
||||||
|
// Only apply whitespace rules if we're dealing with $ delimiter
|
||||||
|
if (state.src[pos] === "$") {
|
||||||
|
if (
|
||||||
|
prevChar === 0x20 /* " " */ ||
|
||||||
|
prevChar === 0x09 /* \t */ ||
|
||||||
|
(nextChar >= 0x30 /* "0" */ && nextChar <= 0x39) /* "9" */
|
||||||
|
) {
|
||||||
|
can_close = false;
|
||||||
|
}
|
||||||
|
if (nextChar === 0x20 /* " " */ || nextChar === 0x09 /* \t */) {
|
||||||
|
can_open = false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return {
|
||||||
|
can_open: can_open,
|
||||||
|
can_close: can_close,
|
||||||
|
};
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
 * Find the first occurrence of `delim` at or after `from` that is not
 * escaped, i.e. that is preceded by an even number of backslashes.
 *
 * @param {string} src - Text to search.
 * @param {string} delim - Delimiter to look for ("$" or "\\)").
 * @param {number} from - Index to start searching at.
 * @returns {number} Index of the delimiter, or -1 when there is none.
 */
function findUnescapedDelim(src, delim, from) {
  let match = from;
  while ((match = src.indexOf(delim, match)) !== -1) {
    // Walk back over the run of backslashes directly before the candidate;
    // `pos` ends on the first non-backslash character (or -1).
    let pos = match - 1;
    while (src[pos] === "\\") {
      pos -= 1;
    }

    // Even number of escapes: this is a real delimiter.
    if ((match - pos) % 2 === 1) {
      return match;
    }
    match += 1;
  }
  return -1;
}

/**
 * Inline rule that recognises `$...$` and `\(...\)` math spans.
 *
 * On a match it pushes a `math_inline` token (unless `silent`) whose
 * `content` is the text between the delimiters and whose `markup` is the
 * opening delimiter, then advances `state.pos` past the closing delimiter.
 * When an opening delimiter is seen but cannot form a span, the delimiter is
 * appended to `state.pending` as plain text and consumed.
 *
 * @param {object} state - Inline parser state; reads `src`, `pos`, `posMax`
 *   and writes `pos`, `pending`, and tokens via `state.push`.
 * @param {boolean} silent - When true, only advance `state.pos`; emit nothing.
 * @returns {boolean} `false` when the current character is not a math
 *   delimiter, otherwise `true`.
 */
function math_inline(state, silent) {
  const src = state.src;
  const isDollar = src[state.pos] === "$";
  const isParen = src[state.pos] === "\\" && src[state.pos + 1] === "(";

  // Only process $ and \( delimiters for inline math
  if (!isDollar && !isParen) {
    return false;
  }

  // Handle the \( ... \) case separately: no whitespace heuristics apply.
  if (isParen) {
    const start = state.pos + 2;
    const match = findUnescapedDelim(src, "\\)", start);

    // No closing \) found. Emit the opener as text and continue after it.
    if (match === -1) {
      if (!silent) {
        state.pending += "\\(";
      }
      state.pos = start;
      return true;
    }

    if (!silent) {
      const token = state.push("math_inline", "math", 0);
      token.markup = "\\(";
      token.content = src.slice(start, match);
    }

    state.pos = match + 2;
    return true;
  }

  let res = isValidDelim(state, state.pos);
  if (!res.can_open) {
    if (!silent) {
      state.pending += "$";
    }
    state.pos += 1;
    return true;
  }

  // Look for the closing "$", skipping all properly escaped delimiters.
  // The search starts one past the opening "$", so the backslash scan in
  // the helper never starts before index 0.
  const start = state.pos + 1;
  const match = findUnescapedDelim(src, "$", start);

  // No closing delimiter found. Consume $ and continue.
  if (match === -1) {
    if (!silent) {
      state.pending += "$";
    }
    state.pos = start;
    return true;
  }

  // Check if we have empty content, ie: $$. Do not parse.
  if (match - start === 0) {
    if (!silent) {
      state.pending += "$$";
    }
    state.pos = start + 1;
    return true;
  }

  // Check for valid closing delimiter
  res = isValidDelim(state, match);
  if (!res.can_close) {
    if (!silent) {
      state.pending += "$";
    }
    state.pos = start;
    return true;
  }

  if (!silent) {
    const token = state.push("math_inline", "math", 0);
    token.markup = "$";
    token.content = src.slice(start, match);
  }

  state.pos = match + 1;
  return true;
}
|
||||||
|
|
||||||
|
/**
 * Block rule that recognises display math opened by `$$` or `\[` at the
 * start of a line and closed by `$$` or `\]` respectively at the end of the
 * same or a later line.
 *
 * On success (and when not `silent`) a `math_block` token is pushed whose
 * `content` is the text between the delimiters and whose `markup` is the
 * closing delimiter. If no closing delimiter is found, everything up to the
 * end of the range (or up to the first line indented less than
 * `state.blkIndent`) is taken as the block content.
 *
 * @param {object} state - Block parser state; reads `src`, `bMarks`,
 *   `eMarks`, `tShift`, `blkIndent`, `getLines` and writes `line` and tokens.
 * @param {number} start - Index of the first line to examine.
 * @param {number} end - Index one past the last line available.
 * @param {boolean} silent - When true, only report whether a block starts here.
 * @returns {boolean} `true` if a math block starts at `start`.
 */
function math_block(state, start, end, silent) {
  let pos = state.bMarks[start] + state.tShift[start];
  let max = state.eMarks[start];

  // Check for $$ or \[ as opening delimiters
  if (pos + 1 > max) {
    return false;
  }

  const openDelim = state.src.slice(pos, pos + 2);
  let delimiter;
  if (openDelim === "$$") {
    delimiter = "$$";
  } else if (openDelim === "\\[") {
    delimiter = "\\]";
  } else {
    return false;
  }

  // Both opening delimiters are two characters long.
  pos += openDelim.length;
  let firstLine = state.src.slice(pos, max);
  let lastLine;
  let found = false;

  if (silent) {
    return true;
  }

  if (firstLine.trim().slice(-delimiter.length) === delimiter) {
    // Single line expression
    firstLine = firstLine.trim().slice(0, -delimiter.length);
    found = true;
  }

  let next = start;
  while (!found) {
    next++;

    if (next >= end) {
      break;
    }

    pos = state.bMarks[next] + state.tShift[next];
    max = state.eMarks[next];

    if (pos < max && state.tShift[next] < state.blkIndent) {
      // non-empty line with negative indent should stop the block:
      break;
    }

    if (
      state.src.slice(pos, max).trim().slice(-delimiter.length) === delimiter
    ) {
      const lastPos = state.src.slice(0, max).lastIndexOf(delimiter);
      lastLine = state.src.slice(pos, lastPos);
      found = true;
    }
  }

  // Only step past line `next` when it actually held the closing delimiter.
  // Otherwise `next` is either `end` or the dedented line that terminated
  // the block, and that line must stay available to the following rules
  // instead of being silently skipped.
  state.line = found ? next + 1 : next;

  const token = state.push("math_block", "math", 0);
  token.block = true;
  token.content =
    (firstLine && firstLine.trim() ? firstLine + "\n" : "") +
    state.getLines(start + 1, next, state.tShift[start], true) +
    (lastLine && lastLine.trim() ? lastLine : "");
  token.map = [start, state.line];
  token.markup = delimiter;
  return true;
}
|
||||||
|
|
||||||
|
/**
 * markdown-it plugin that renders `math_inline` and `math_block` tokens
 * with KaTeX.
 *
 * Registers the `math_inline` inline rule and the `math_block` block rule
 * and installs renderer rules for both token types. If KaTeX throws, the
 * LaTeX source is emitted HTML-escaped, so a failed render can never inject
 * markup into the page.
 *
 * @param {object} md - markdown-it instance to extend.
 * @param {object} [options] - Options forwarded to `katex.renderToString`.
 *   The object is not modified; `displayMode` is set on a per-call copy.
 *   When `options.throwOnError` is truthy, render errors are logged.
 * @returns {void}
 */
export default function math_plugin(md, options) {
  // Default options
  const baseOptions = options || {};

  /**
   * Render `latex` with KaTeX without touching the caller's options object.
   */
  const renderWithKatex = function (latex, displayMode) {
    return katex.renderToString(
      latex,
      Object.assign({}, baseOptions, { displayMode: displayMode })
    );
  };

  /**
   * Fallback used when KaTeX fails: show the source as text. It is escaped
   * because renderer output is inserted into the document as HTML.
   */
  const renderFailure = function (latex, error) {
    if (baseOptions.throwOnError) {
      console.log(error);
    }
    return md.utils.escapeHtml(latex);
  };

  const katexInline = function (latex) {
    // Remove surrounding delimiters if present
    const stripped = latex
      .replace(/^\[(.*)\]$/, "$1")
      .replace(/^\\\((.*)\\\)$/, "$1")
      .replace(/^\\\[(.*)\\\]$/, "$1");
    try {
      return renderWithKatex(stripped, false);
    } catch (error) {
      return renderFailure(stripped, error);
    }
  };

  const inlineRenderer = function (tokens, idx) {
    return katexInline(tokens[idx].content);
  };

  const katexBlock = function (latex) {
    // Remove surrounding delimiters if present
    const stripped = latex
      .replace(/^\[(.*)\]$/, "$1")
      .replace(/^\\\[(.*)\\\]$/, "$1");
    try {
      return "<p>" + renderWithKatex(stripped, true) + "</p>";
    } catch (error) {
      return renderFailure(stripped, error);
    }
  };

  const blockRenderer = function (tokens, idx) {
    return katexBlock(tokens[idx].content) + "\n";
  };

  // NOTE(review): markdown-it's built-in `escape` rule also matches a
  // backslash followed by "(", so registering after it may keep the `\(`
  // branch of math_inline from ever running — confirm against the rule order.
  md.inline.ruler.after("escape", "math_inline", math_inline);
  md.block.ruler.after("blockquote", "math_block", math_block, {
    alt: ["paragraph", "reference", "blockquote", "list"],
  });
  md.renderer.rules.math_inline = inlineRenderer;
  md.renderer.rules.math_block = blockRenderer;
}
|
|
@ -2483,13 +2483,6 @@ lru-cache@^5.1.1:
|
||||||
dependencies:
|
dependencies:
|
||||||
yallist "^3.0.2"
|
yallist "^3.0.2"
|
||||||
|
|
||||||
markdown-it-katex@^2.0.3:
|
|
||||||
version "2.0.3"
|
|
||||||
resolved "https://registry.yarnpkg.com/markdown-it-katex/-/markdown-it-katex-2.0.3.tgz#d7b86a1aea0b9d6496fab4e7919a18fdef589c39"
|
|
||||||
integrity sha512-nUkkMtRWeg7OpdflamflE/Ho/pWl64Lk9wNBKOmaj33XkQdumhXAIYhI0WO03GeiycPCsxbmX536V5NEXpC3Ng==
|
|
||||||
dependencies:
|
|
||||||
katex "^0.6.0"
|
|
||||||
|
|
||||||
markdown-it@^13.0.1:
|
markdown-it@^13.0.1:
|
||||||
version "13.0.2"
|
version "13.0.2"
|
||||||
resolved "https://registry.yarnpkg.com/markdown-it/-/markdown-it-13.0.2.tgz#1bc22e23379a6952e5d56217fbed881e0c94d536"
|
resolved "https://registry.yarnpkg.com/markdown-it/-/markdown-it-13.0.2.tgz#1bc22e23379a6952e5d56217fbed881e0c94d536"
|
||||||
|
|
Loading…
Add table
Reference in a new issue