import DOMPurify from 'dompurify';
import type { MermaidConfig } from '../../config.type.js';

// Remove and ignore br:s
export const lineBreakRegex = /<br\s*\/?>/gi;

// Non-global twin of `lineBreakRegex`, used only for `.test()`. A global regex
// keeps `lastIndex` between `.test()` calls, which makes repeated calls return
// alternating results for the same input.
const lineBreakTestRegex = new RegExp(lineBreakRegex.source, 'i');

/**
 * Gets the rows of lines in a string
 *
 * Both `<br>` tags and literal backslash-n sequences (the two characters `\`
 * and `n`) are treated as row separators.
 *
 * @param s - The string to check the lines for
 * @returns The rows in that string; `['']` when `s` is empty or undefined
 */
export const getRows = (s?: string): string[] => {
  if (!s) {
    return [''];
  }
  const str = breakToPlaceholder(s).replace(/\\n/g, '#br#');
  return str.split('#br#');
};

/**
 * Registers the DOMPurify hooks the first time it is called; later calls are no-ops.
 */
const setupDompurifyHooksIfNotSetup = (() => {
  let setup = false;

  return () => {
    if (!setup) {
      setupDompurifyHooks();
      setup = true;
    }
  };
})();

/**
 * Installs DOMPurify hooks that carry the `target` attribute of `<a>` elements
 * across attribute sanitization.
 *
 * The value is stashed in a temporary attribute before sanitization and
 * restored afterwards (presumably because DOMPurify would otherwise drop
 * `target` - confirm against the DOMPurify defaults in use). Links that end up
 * with `target="_blank"` additionally get `rel="noopener"`.
 */
function setupDompurifyHooks() {
  const TEMPORARY_ATTRIBUTE = 'data-temp-href-target';

  DOMPurify.addHook('beforeSanitizeAttributes', (node: Element) => {
    if (node.tagName === 'A' && node.hasAttribute('target')) {
      node.setAttribute(TEMPORARY_ATTRIBUTE, node.getAttribute('target') ?? '');
    }
  });

  DOMPurify.addHook('afterSanitizeAttributes', (node: Element) => {
    if (node.tagName === 'A' && node.hasAttribute(TEMPORARY_ATTRIBUTE)) {
      node.setAttribute('target', node.getAttribute(TEMPORARY_ATTRIBUTE) ?? '');
      node.removeAttribute(TEMPORARY_ATTRIBUTE);
      if (node.getAttribute('target') === '_blank') {
        node.setAttribute('rel', 'noopener');
      }
    }
  });
}

/**
 * Removes script tags from a text
 *
 * @param txt - The text to sanitize
 * @returns The safer text
 */
export const removeScript = (txt: string): string => {
  setupDompurifyHooksIfNotSetup();
  return DOMPurify.sanitize(txt);
};

/**
 * Applies the security-level dependent pre-sanitization step.
 *
 * Nothing is done when `flowchart.htmlLabels` is explicitly `false`. Otherwise:
 * - `antiscript` / `strict`: the text is run through {@link removeScript};
 * - `loose`: the text is returned unchanged;
 * - any other level: `<`, `>` and `=` are replaced by HTML entities, while
 *   `<br>` tags are preserved via the `#br#` placeholder round trip.
 *
 * @param text - The text to sanitize
 * @param config - Configuration for Mermaid
 * @returns The pre-sanitized text
 */
const sanitizeMore = (text: string, config: MermaidConfig) => {
  if (config.flowchart?.htmlLabels !== false) {
    const level = config.securityLevel;
    if (level === 'antiscript' || level === 'strict') {
      text = removeScript(text);
    } else if (level !== 'loose') {
      // Protect line breaks before escaping, then put them back afterwards.
      text = breakToPlaceholder(text);
      text = text.replace(/</g, '&lt;').replace(/>/g, '&gt;');
      text = text.replace(/=/g, '&equals;');
      text = placeholderToBreak(text);
    }
  }
  return text;
};

/**
 * Sanitizes a text according to the Mermaid configuration.
 *
 * The text first goes through {@link sanitizeMore} and then through DOMPurify,
 * using `config.dompurifyConfig` when it is set and otherwise a configuration
 * that forbids `style` tags.
 *
 * @param text - The text to sanitize
 * @param config - Configuration for Mermaid
 * @returns The sanitized text; falsy input is returned unchanged
 */
export const sanitizeText = (text: string, config: MermaidConfig): string => {
  if (!text) {
    return text;
  }
  if (config.dompurifyConfig) {
    // eslint-disable-next-line @typescript-eslint/no-base-to-string
    text = DOMPurify.sanitize(sanitizeMore(text, config), config.dompurifyConfig).toString();
  } else {
    text = DOMPurify.sanitize(sanitizeMore(text, config), {
      FORBID_TAGS: ['style'],
    }).toString();
  }
  return text;
};

/**
 * Sanitizes either a single string or a (possibly nested) array of strings.
 *
 * @param a - A string, an array of strings, or an array of string arrays
 * @param config - Configuration for Mermaid
 * @returns The sanitized string, or a flat array of sanitized strings
 *   (one level of nesting is flattened)
 */
export const sanitizeTextOrArray = (
  a: string | string[] | string[][],
  config: MermaidConfig
): string | string[] => {
  if (typeof a === 'string') {
    return sanitizeText(a, config);
  }
  // TODO: Refactor to avoid flat.
  return a.flat().map((x: string) => sanitizeText(x, config));
};

/**
 * Whether or not a text has any line breaks
 *
 * @param text - The text to test
 * @returns Whether or not the text has breaks
 */
export const hasBreaks = (text: string): boolean => {
  // Deliberately not `lineBreakRegex.test(...)`: that regex is global and would
  // remember `lastIndex` from a previous successful match.
  return lineBreakTestRegex.test(text);
};

/**
 * Splits on <br> tags
 *
 * @param text - Text to split
 * @returns List of lines as strings
 */
export const splitBreaks = (text: string): string[] => {
  return text.split(lineBreakRegex);
};

/**
 * Converts placeholders to line breaks in HTML
 *
 * @param s - HTML with placeholders
 * @returns HTML with breaks instead of placeholders
 */
const placeholderToBreak = (s: string): string => {
  return s.replace(/#br#/g, '<br/>');
};

/**
 * Opposite of `placeholderToBreak`, converts breaks to placeholders
 *
 * @param s - HTML string
 * @returns String with placeholders
 */
const breakToPlaceholder = (s: string): string => {
  return s.replace(lineBreakRegex, '#br#');
};

/**
 * Gets the current URL
 *
 * @param useAbsolute - Whether to return the absolute URL or not
 * @returns The current URL (protocol, host, path and query string) with
 *   parentheses backslash-escaped, or an empty string when `useAbsolute` is false
 */
const getUrl = (useAbsolute: boolean): string => {
  let url = '';
  if (useAbsolute) {
    url =
      window.location.protocol +
      '//' +
      window.location.host +
      window.location.pathname +
      window.location.search;
    url = url.replaceAll(/\(/g, '\\(');
    url = url.replaceAll(/\)/g, '\\)');
  }

  return url;
};

/**
 * Converts a string/boolean into a boolean
 *
 * Only `false` and the strings `'false'`, `'null'` and `'0'` (ignoring case and
 * surrounding whitespace) evaluate to `false`; everything else, including
 * `undefined`, evaluates to `true`.
 *
 * @param val - String or boolean to convert
 * @returns The result from the input
 */
export const evaluate = (val?: string | boolean): boolean =>
  !(val === false || ['false', 'null', '0'].includes(String(val).trim().toLowerCase()));

/**
 * Wrapper around Math.max which removes non-numeric values
 * Returns the larger of a set of supplied numeric expressions.
 * @param values - Numeric expressions to be evaluated
 * @returns The larger value (`-Infinity` when no numeric value is supplied)
 */
export const getMax = function (...values: number[]): number {
  const newValues: number[] = values.filter((value) => {
    return !isNaN(value);
  });
  return Math.max(...newValues);
};

/**
 * Wrapper around Math.min which removes non-numeric values
 * Returns the smaller of a set of supplied numeric expressions.
 * @param values - Numeric expressions to be evaluated
 * @returns The smaller value (`Infinity` when no numeric value is supplied)
 */
export const getMin = function (...values: number[]): number {
  const newValues: number[] = values.filter((value) => {
    return !isNaN(value);
  });
  return Math.min(...newValues);
};

/**
 * Makes generics in typescript syntax
 *
 * @example
 * Array of array of strings in typescript syntax
 *
 * ```js
 * // returns "Array<Array<string>>"
 * parseGenericTypes('Array~Array~string~~');
 * ```
 * @param input - The text to convert
 * @returns The converted string
 */
export const parseGenericTypes = function (input: string): string {
  const inputSets = input.split(/(,)/);
  const output: string[] = [];

  for (let i = 0; i < inputSets.length; i++) {
    let thisSet = inputSets[i];

    // if the original input included a value such as "~K, V~"", these will be split into
    // an array of ["~K",","," V~"].
    // This means that on each call of processSet, there will only be 1 ~ present
    // To account for this, if we encounter a ",", we are checking the previous and next sets in the array
    // to see if they contain matching ~'s
    // in which case we are assuming that they should be rejoined and sent to be processed
    if (thisSet === ',' && i > 0 && i + 1 < inputSets.length) {
      const previousSet = inputSets[i - 1];
      const nextSet = inputSets[i + 1];

      if (shouldCombineSets(previousSet, nextSet)) {
        thisSet = previousSet + ',' + nextSet;
        i++; // Move the index forward to skip the next iteration since we're combining sets
        output.pop(); // Drop the already-emitted previous set; it is part of the combined set now
      }
    }

    output.push(processSet(thisSet));
  }

  return output.join('');
};

/**
 * Counts the non-overlapping occurrences of a substring in a string.
 *
 * @param string - The string to search in
 * @param substring - The substring to count
 * @returns The number of occurrences, never negative
 */
export const countOccurrence = (string: string, substring: string): number => {
  return Math.max(0, string.split(substring).length - 1);
};

/**
 * Decides whether two comma-separated sets belong to the same generic.
 *
 * @param previousSet - The set before the comma
 * @param nextSet - The set after the comma
 * @returns `true` when each set contains exactly one `~`
 */
const shouldCombineSets = (previousSet: string, nextSet: string): boolean => {
  const prevCount = countOccurrence(previousSet, '~');
  const nextCount = countOccurrence(nextSet, '~');

  return prevCount === 1 && nextCount === 1;
};

/**
 * Replaces paired tildes in a single set with angle brackets, pairing the
 * outermost remaining tildes first.
 *
 * @param input - The set to convert
 * @returns The converted set; inputs with at most one `~` are returned unchanged
 */
const processSet = (input: string): string => {
  const tildeCount = countOccurrence(input, '~');
  let hasStartingTilde = false;

  if (tildeCount <= 1) {
    return input;
  }

  // If there is an odd number of tildes, and the input starts with a tilde, we need to remove it and add it back in later
  if (tildeCount % 2 !== 0 && input.startsWith('~')) {
    input = input.substring(1);
    hasStartingTilde = true;
  }

  const chars = [...input];

  let first = chars.indexOf('~');
  let last = chars.lastIndexOf('~');

  while (first !== -1 && last !== -1 && first !== last) {
    chars[first] = '<';
    chars[last] = '>';

    first = chars.indexOf('~');
    last = chars.lastIndexOf('~');
  }

  // Add the starting tilde back in if we removed it
  if (hasStartingTilde) {
    chars.unshift('~');
  }

  return chars.join('');
};

// TODO: find a better method for detecting support. This interface was added in the MathML 4 spec.
// Firefox versions between [4,71] (0.47%) and Safari versions between [5,13.4] (0.17%) don't have this interface implemented but MathML is supported
export const isMathMLSupported = () => window.MathMLElement !== undefined;

export const katexRegex = /\$\$(.*)\$\$/g;

/**
 * Whether or not a text has KaTeX delimiters
 *
 * @param text - The text to test
 * @returns Whether or not the text has KaTeX delimiters
 */
export const hasKatex = (text: string): boolean => (text.match(katexRegex)?.length ?? 0) > 0;

/**
 * Computes the minimum dimensions needed to display a div containing MathML
 *
 * The rendered text is placed in a hidden, absolutely positioned div that is
 * appended to the document body, measured, and removed again.
 *
 * @param text - The text to test
 * @param config - Configuration for Mermaid
 * @returns Object containing \{width, height\}
 */
export const calculateMathMLDimensions = async (text: string, config: MermaidConfig) => {
  text = await renderKatex(text, config);
  const divElem = document.createElement('div');
  divElem.innerHTML = text;
  divElem.id = 'katex-temp';
  divElem.style.visibility = 'hidden';
  divElem.style.position = 'absolute';
  divElem.style.top = '0';
  const body = document.querySelector('body');
  body?.insertAdjacentElement('beforeend', divElem);
  const dim = { width: divElem.clientWidth, height: divElem.clientHeight };
  divElem.remove();
  return dim;
};

/**
 * Attempts to render and return the KaTeX portion of a string with MathML
 *
 * @param text - The text to test
 * @param config - Configuration for Mermaid
 * @returns String containing MathML if KaTeX is supported, or an error message if it is not and stylesheets aren't present
 */
export const renderKatex = async (text: string, config: MermaidConfig): Promise<string> => {
  if (!hasKatex(text)) {
    return text;
  }

  if (!(isMathMLSupported() || config.legacyMathML || config.forceLegacyMathML)) {
    return text.replace(katexRegex, 'MathML is unsupported in this environment.');
  }

  // Loaded lazily so that the dependency is only pulled in when a text actually contains KaTeX.
  const { default: katex } = await import('katex');
  const outputMode =
    config.forceLegacyMathML || (!isMathMLSupported() && config.legacyMathML)
      ? 'htmlAndMathml'
      : 'mathml';
  // NOTE(review): the wrapper markup of both branches and the annotation-stripping
  // pattern below were lost from this file and have been reconstructed - confirm
  // the exact markup against the upstream implementation.
  return text
    .split(lineBreakRegex)
    .map((line) =>
      hasKatex(line)
        ? `<div style="display: flex; align-items: center; justify-content: center; white-space: nowrap;">${line}</div>`
        : `<div>${line}</div>`
    )
    .join('')
    .replace(katexRegex, (_, c) =>
      katex
        .renderToString(c, {
          throwOnError: true,
          displayMode: true,
          output: outputMode,
        })
        .replace(/\n/g, ' ')
        .replace(/<annotation.*<\/annotation>/g, '')
    );
};

export default {
  getRows,
  sanitizeText,
  sanitizeTextOrArray,
  hasBreaks,
  splitBreaks,
  lineBreakRegex,
  removeScript,
  getUrl,
  evaluate,
  getMax,
  getMin,
};