Path: blob/main/src/vs/base/browser/markdownRenderer.ts
3292 views
/*---------------------------------------------------------------------------------------------1* Copyright (c) Microsoft Corporation. All rights reserved.2* Licensed under the MIT License. See License.txt in the project root for license information.3*--------------------------------------------------------------------------------------------*/45import { onUnexpectedError } from '../common/errors.js';6import { escapeDoubleQuotes, IMarkdownString, MarkdownStringTrustedOptions, parseHrefAndDimensions, removeMarkdownEscapes } from '../common/htmlContent.js';7import { markdownEscapeEscapedIcons } from '../common/iconLabels.js';8import { defaultGenerator } from '../common/idGenerator.js';9import { KeyCode } from '../common/keyCodes.js';10import { Lazy } from '../common/lazy.js';11import { DisposableStore } from '../common/lifecycle.js';12import * as marked from '../common/marked/marked.js';13import { parse } from '../common/marshalling.js';14import { FileAccess, Schemas } from '../common/network.js';15import { cloneAndChange } from '../common/objects.js';16import { dirname, resolvePath } from '../common/resources.js';17import { escape } from '../common/strings.js';18import { URI } from '../common/uri.js';19import * as DOM from './dom.js';20import * as domSanitize from './domSanitize.js';21import { convertTagToPlaintext } from './domSanitize.js';22import { StandardKeyboardEvent } from './keyboardEvent.js';23import { StandardMouseEvent } from './mouseEvent.js';24import { renderLabelWithIcons } from './ui/iconLabel/iconLabels.js';2526export type MarkdownActionHandler = (linkContent: string, mdStr: IMarkdownString) => void;2728/**29* Options for the rendering of markdown with {@link renderMarkdown}.30*/31export interface MarkdownRenderOptions {32readonly codeBlockRenderer?: (languageId: string, value: string) => Promise<HTMLElement>;33readonly codeBlockRendererSync?: (languageId: string, value: string, raw?: string) => HTMLElement;34readonly asyncRenderCallback?: () => void;3536readonly actionHandler?: MarkdownActionHandler;3738readonly fillInIncompleteTokens?: boolean;3940readonly sanitizerConfig?: MarkdownSanitizerConfig;4142readonly markedOptions?: MarkdownRendererMarkedOptions;43readonly markedExtensions?: marked.MarkedExtension[];44}4546/**47* Subset of options passed to `Marked` for rendering markdown.48*/49export interface MarkdownRendererMarkedOptions {50readonly gfm?: boolean;51readonly breaks?: boolean;52}5354export interface MarkdownSanitizerConfig {55readonly replaceWithPlaintext?: boolean;56readonly allowedTags?: {57readonly override: readonly string[];58};59readonly allowedAttributes?: {60readonly override: ReadonlyArray<string | domSanitize.SanitizeAttributeRule>;61};62readonly allowedLinkSchemes?: {63readonly augment: readonly string[];64};65readonly remoteImageIsAllowed?: (uri: URI) => boolean;66}6768const defaultMarkedRenderers = Object.freeze({69image: ({ href, title, text }: marked.Tokens.Image): string => {70let dimensions: string[] = [];71let attributes: string[] = [];72if (href) {73({ href, dimensions } = parseHrefAndDimensions(href));74attributes.push(`src="${escapeDoubleQuotes(href)}"`);75}76if (text) {77attributes.push(`alt="${escapeDoubleQuotes(text)}"`);78}79if (title) {80attributes.push(`title="${escapeDoubleQuotes(title)}"`);81}82if (dimensions.length) {83attributes = attributes.concat(dimensions);84}85return '<img ' + attributes.join(' ') + '>';86},8788paragraph(this: marked.Renderer, { tokens }: marked.Tokens.Paragraph): string {89return `<p>${this.parser.parseInline(tokens)}</p>`;90},9192link(this: marked.Renderer, { href, title, tokens }: marked.Tokens.Link): string {93let text = this.parser.parseInline(tokens);94if (typeof href !== 'string') {95return '';96}9798// Remove markdown escapes. Workaround for https://github.com/chjj/marked/issues/82999if (href === text) { // raw link case100text = removeMarkdownEscapes(text);101}102103title = typeof title === 'string' ? escapeDoubleQuotes(removeMarkdownEscapes(title)) : '';104href = removeMarkdownEscapes(href);105106// HTML Encode href107href = href.replace(/&/g, '&')108.replace(/</g, '<')109.replace(/>/g, '>')110.replace(/"/g, '"')111.replace(/'/g, ''');112113return `<a href="${href}" title="${title || href}" draggable="false">${text}</a>`;114},115});116117/**118* Low-level way create a html element from a markdown string.119*120* **Note** that for most cases you should be using {@link import('../../editor/browser/widget/markdownRenderer/browser/markdownRenderer.js').MarkdownRenderer MarkdownRenderer}121* which comes with support for pretty code block rendering and which uses the default way of handling links.122*/123export function renderMarkdown(markdown: IMarkdownString, options: MarkdownRenderOptions = {}, target?: HTMLElement): { element: HTMLElement; dispose: () => void } {124const disposables = new DisposableStore();125let isDisposed = false;126127const markedInstance = new marked.Marked(...(options.markedExtensions ?? []));128const { renderer, codeBlocks, syncCodeBlocks } = createMarkdownRenderer(markedInstance, options, markdown);129const value = preprocessMarkdownString(markdown);130131let renderedMarkdown: string;132if (options.fillInIncompleteTokens) {133// The defaults are applied by parse but not lexer()/parser(), and they need to be present134const opts: marked.MarkedOptions = {135...markedInstance.defaults,136...options.markedOptions,137renderer138};139const tokens = markedInstance.lexer(value, opts);140const newTokens = fillInIncompleteTokens(tokens);141renderedMarkdown = markedInstance.parser(newTokens, opts);142} else {143renderedMarkdown = markedInstance.parse(value, { ...options?.markedOptions, renderer, async: false });144}145146// Rewrite theme icons147if (markdown.supportThemeIcons) {148const elements = renderLabelWithIcons(renderedMarkdown);149renderedMarkdown = elements.map(e => typeof e === 'string' ? e : e.outerHTML).join('');150}151152const renderedContent = document.createElement('div');153const sanitizerConfig = getDomSanitizerConfig(markdown.isTrusted ?? false, options.sanitizerConfig ?? {});154domSanitize.safeSetInnerHtml(renderedContent, renderedMarkdown, sanitizerConfig);155156// Rewrite links and images before potentially inserting them into the real dom157rewriteRenderedLinks(markdown, options, renderedContent);158159let outElement: HTMLElement;160if (target) {161outElement = target;162DOM.reset(target, ...renderedContent.children);163} else {164outElement = renderedContent;165}166167if (codeBlocks.length > 0) {168Promise.all(codeBlocks).then((tuples) => {169if (isDisposed) {170return;171}172const renderedElements = new Map(tuples);173const placeholderElements = outElement.querySelectorAll<HTMLDivElement>(`div[data-code]`);174for (const placeholderElement of placeholderElements) {175const renderedElement = renderedElements.get(placeholderElement.dataset['code'] ?? '');176if (renderedElement) {177DOM.reset(placeholderElement, renderedElement);178}179}180options.asyncRenderCallback?.();181});182} else if (syncCodeBlocks.length > 0) {183const renderedElements = new Map(syncCodeBlocks);184const placeholderElements = outElement.querySelectorAll<HTMLDivElement>(`div[data-code]`);185for (const placeholderElement of placeholderElements) {186const renderedElement = renderedElements.get(placeholderElement.dataset['code'] ?? '');187if (renderedElement) {188DOM.reset(placeholderElement, renderedElement);189}190}191}192193// Signal size changes for image tags194if (options.asyncRenderCallback) {195for (const img of outElement.getElementsByTagName('img')) {196const listener = disposables.add(DOM.addDisposableListener(img, 'load', () => {197listener.dispose();198options.asyncRenderCallback!();199}));200}201}202203// Add event listeners for links204if (options.actionHandler) {205const clickCb = (e: PointerEvent) => {206const mouseEvent = new StandardMouseEvent(DOM.getWindow(outElement), e);207if (!mouseEvent.leftButton && !mouseEvent.middleButton) {208return;209}210activateLink(markdown, options, mouseEvent);211};212disposables.add(DOM.addDisposableListener(outElement, 'click', clickCb));213disposables.add(DOM.addDisposableListener(outElement, 'auxclick', clickCb));214215disposables.add(DOM.addDisposableListener(outElement, 'keydown', (e) => {216const keyboardEvent = new StandardKeyboardEvent(e);217if (!keyboardEvent.equals(KeyCode.Space) && !keyboardEvent.equals(KeyCode.Enter)) {218return;219}220activateLink(markdown, options, keyboardEvent);221}));222}223224// Remove/disable inputs225for (const input of [...outElement.getElementsByTagName('input')]) {226if (input.attributes.getNamedItem('type')?.value === 'checkbox') {227input.setAttribute('disabled', '');228} else {229if (options.sanitizerConfig?.replaceWithPlaintext) {230const replacement = convertTagToPlaintext(input);231input.parentElement?.replaceChild(replacement, input);232} else {233input.remove();234}235}236}237238return {239element: outElement,240dispose: () => {241isDisposed = true;242disposables.dispose();243}244};245}246247function rewriteRenderedLinks(markdown: IMarkdownString, options: MarkdownRenderOptions, root: HTMLElement) {248for (const el of root.querySelectorAll('img, audio, video, source')) {249const src = el.getAttribute('src'); // Get the raw 'src' attribute value as text, not the resolved 'src'250if (src) {251let href = src;252try {253if (markdown.baseUri) { // absolute or relative local path, or file: uri254href = resolveWithBaseUri(URI.from(markdown.baseUri), href);255}256} catch (err) { }257258el.setAttribute('src', massageHref(markdown, href, true));259260if (options.sanitizerConfig?.remoteImageIsAllowed) {261const uri = URI.parse(href);262if (uri.scheme !== Schemas.file && uri.scheme !== Schemas.data && !options.sanitizerConfig.remoteImageIsAllowed(uri)) {263el.replaceWith(DOM.$('', undefined, el.outerHTML));264}265}266}267}268269for (const el of root.querySelectorAll('a')) {270const href = el.getAttribute('href'); // Get the raw 'href' attribute value as text, not the resolved 'href'271el.setAttribute('href', ''); // Clear out href. We use the `data-href` for handling clicks instead272if (!href273|| /^data:|javascript:/i.test(href)274|| (/^command:/i.test(href) && !markdown.isTrusted)275|| /^command:(\/\/\/)?_workbench\.downloadResource/i.test(href)) {276// drop the link277el.replaceWith(...el.childNodes);278} else {279let resolvedHref = massageHref(markdown, href, false);280if (markdown.baseUri) {281resolvedHref = resolveWithBaseUri(URI.from(markdown.baseUri), href);282}283el.dataset.href = resolvedHref;284}285}286}287288function createMarkdownRenderer(marked: marked.Marked, options: MarkdownRenderOptions, markdown: IMarkdownString): { renderer: marked.Renderer; codeBlocks: Promise<[string, HTMLElement]>[]; syncCodeBlocks: [string, HTMLElement][] } {289const renderer = new marked.Renderer(options.markedOptions);290renderer.image = defaultMarkedRenderers.image;291renderer.link = defaultMarkedRenderers.link;292renderer.paragraph = defaultMarkedRenderers.paragraph;293294// Will collect [id, renderedElement] tuples295const codeBlocks: Promise<[string, HTMLElement]>[] = [];296const syncCodeBlocks: [string, HTMLElement][] = [];297298if (options.codeBlockRendererSync) {299renderer.code = ({ text, lang, raw }: marked.Tokens.Code) => {300const id = defaultGenerator.nextId();301const value = options.codeBlockRendererSync!(postProcessCodeBlockLanguageId(lang), text, raw);302syncCodeBlocks.push([id, value]);303return `<div class="code" data-code="${id}">${escape(text)}</div>`;304};305} else if (options.codeBlockRenderer) {306renderer.code = ({ text, lang }: marked.Tokens.Code) => {307const id = defaultGenerator.nextId();308const value = options.codeBlockRenderer!(postProcessCodeBlockLanguageId(lang), text);309codeBlocks.push(value.then(element => [id, element]));310return `<div class="code" data-code="${id}">${escape(text)}</div>`;311};312}313314if (!markdown.supportHtml) {315// Note: we always pass the output through dompurify after this so that we don't rely on316// marked for real sanitization.317renderer.html = ({ text }) => {318if (options.sanitizerConfig?.replaceWithPlaintext) {319return escape(text);320}321322const match = markdown.isTrusted ? text.match(/^(<span[^>]+>)|(<\/\s*span>)$/) : undefined;323return match ? text : '';324};325}326return { renderer, codeBlocks, syncCodeBlocks };327}328329function preprocessMarkdownString(markdown: IMarkdownString) {330let value = markdown.value;331332// values that are too long will freeze the UI333if (value.length > 100_000) {334value = `${value.substr(0, 100_000)}…`;335}336337// escape theme icons338if (markdown.supportThemeIcons) {339value = markdownEscapeEscapedIcons(value);340}341342return value;343}344345function activateLink(mdStr: IMarkdownString, options: MarkdownRenderOptions, event: StandardMouseEvent | StandardKeyboardEvent): void {346const target = event.target.closest('a[data-href]');347if (!DOM.isHTMLElement(target)) {348return;349}350351try {352let href = target.dataset['href'];353if (href) {354if (mdStr.baseUri) {355href = resolveWithBaseUri(URI.from(mdStr.baseUri), href);356}357options.actionHandler?.(href, mdStr);358}359} catch (err) {360onUnexpectedError(err);361} finally {362event.preventDefault();363}364}365366function uriMassage(markdown: IMarkdownString, part: string): string {367let data: unknown;368try {369data = parse(decodeURIComponent(part));370} catch (e) {371// ignore372}373if (!data) {374return part;375}376data = cloneAndChange(data, value => {377if (markdown.uris && markdown.uris[value]) {378return URI.revive(markdown.uris[value]);379} else {380return undefined;381}382});383return encodeURIComponent(JSON.stringify(data));384}385386function massageHref(markdown: IMarkdownString, href: string, isDomUri: boolean): string {387const data = markdown.uris && markdown.uris[href];388let uri = URI.revive(data);389if (isDomUri) {390if (href.startsWith(Schemas.data + ':')) {391return href;392}393if (!uri) {394uri = URI.parse(href);395}396// this URI will end up as "src"-attribute of a dom node397// and because of that special rewriting needs to be done398// so that the URI uses a protocol that's understood by399// browsers (like http or https)400return FileAccess.uriToBrowserUri(uri).toString(true);401}402if (!uri) {403return href;404}405if (URI.parse(href).toString() === uri.toString()) {406return href; // no transformation performed407}408if (uri.query) {409uri = uri.with({ query: uriMassage(markdown, uri.query) });410}411return uri.toString();412}413414function postProcessCodeBlockLanguageId(lang: string | undefined): string {415if (!lang) {416return '';417}418419const parts = lang.split(/[\s+|:|,|\{|\?]/, 1);420if (parts.length) {421return parts[0];422}423return lang;424}425426function resolveWithBaseUri(baseUri: URI, href: string): string {427const hasScheme = /^\w[\w\d+.-]*:/.test(href);428if (hasScheme) {429return href;430}431432if (baseUri.path.endsWith('/')) {433return resolvePath(baseUri, href).toString();434} else {435return resolvePath(dirname(baseUri), href).toString();436}437}438439function sanitizeRenderedMarkdown(440renderedMarkdown: string,441isTrusted: boolean | MarkdownStringTrustedOptions,442options: MarkdownSanitizerConfig = {},443): TrustedHTML {444const sanitizerConfig = getDomSanitizerConfig(isTrusted, options);445return domSanitize.sanitizeHtml(renderedMarkdown, sanitizerConfig);446}447448export const allowedMarkdownHtmlTags = Object.freeze([449...domSanitize.basicMarkupHtmlTags,450'input', // Allow inputs for rendering checkboxes. Other types of inputs are removed and the inputs are always disabled451]);452453export const allowedMarkdownHtmlAttributes = Object.freeze<Array<string | domSanitize.SanitizeAttributeRule>>([454'align',455'autoplay',456'alt',457'colspan',458'controls',459'draggable',460'height',461'href',462'loop',463'muted',464'playsinline',465'poster',466'rowspan',467'src',468'target',469'title',470'type',471'width',472'start',473474// Input (For disabled inputs)475'checked',476'disabled',477'value',478479// Custom markdown attributes480'data-code',481'data-href',482483// Only allow very specific styles484{485attributeName: 'style',486shouldKeep: (element, data) => {487if (element.tagName === 'SPAN') {488if (data.attrName === 'style') {489return /^(color\:(#[0-9a-fA-F]+|var\(--vscode(-[a-zA-Z0-9]+)+\));)?(background-color\:(#[0-9a-fA-F]+|var\(--vscode(-[a-zA-Z0-9]+)+\));)?(border-radius:[0-9]+px;)?$/.test(data.attrValue);490}491}492return false;493}494},495496// Only allow codicons for classes497{498attributeName: 'class',499shouldKeep: (element, data) => {500if (element.tagName === 'SPAN') {501if (data.attrName === 'class') {502return /^codicon codicon-[a-z\-]+( codicon-modifier-[a-z\-]+)?$/.test(data.attrValue);503}504}505return false;506},507},508]);509510function getDomSanitizerConfig(isTrusted: boolean | MarkdownStringTrustedOptions, options: MarkdownSanitizerConfig): domSanitize.DomSanitizerConfig {511const allowedLinkSchemes = [512Schemas.http,513Schemas.https,514Schemas.mailto,515Schemas.file,516Schemas.vscodeFileResource,517Schemas.vscodeRemote,518Schemas.vscodeRemoteResource,519Schemas.vscodeNotebookCell520];521522if (isTrusted) {523allowedLinkSchemes.push(Schemas.command);524}525526if (options.allowedLinkSchemes?.augment) {527allowedLinkSchemes.push(...options.allowedLinkSchemes.augment);528}529530return {531// allowedTags should included everything that markdown renders to.532// Since we have our own sanitize function for marked, it's possible we missed some tag so let dompurify make sure.533// HTML tags that can result from markdown are from reading https://spec.commonmark.org/0.29/534// HTML table tags that can result from markdown are from https://github.github.com/gfm/#tables-extension-535allowedTags: {536override: options.allowedTags?.override ?? allowedMarkdownHtmlTags537},538allowedAttributes: {539override: options.allowedAttributes?.override ?? allowedMarkdownHtmlAttributes,540},541allowedLinkProtocols: {542override: allowedLinkSchemes,543},544allowedMediaProtocols: {545override: [546Schemas.http,547Schemas.https,548Schemas.data,549Schemas.file,550Schemas.vscodeFileResource,551Schemas.vscodeRemote,552Schemas.vscodeRemoteResource,553]554},555replaceWithPlaintext: options.replaceWithPlaintext,556};557}558559/**560* Renders `str` as plaintext, stripping out Markdown syntax if it's a {@link IMarkdownString}.561*562* For example `# Header` would be output as `Header`.563*/564export function renderAsPlaintext(str: IMarkdownString | string, options?: {565/** Controls if the ``` of code blocks should be preserved in the output or not */566readonly includeCodeBlocksFences?: boolean;567}) {568if (typeof str === 'string') {569return str;570}571572// values that are too long will freeze the UI573let value = str.value ?? '';574if (value.length > 100_000) {575value = `${value.substr(0, 100_000)}…`;576}577578const html = marked.parse(value, { async: false, renderer: options?.includeCodeBlocksFences ? plainTextWithCodeBlocksRenderer.value : plainTextRenderer.value });579return sanitizeRenderedMarkdown(html, /* isTrusted */ false, {})580.toString()581.replace(/&(#\d+|[a-zA-Z]+);/g, m => unescapeInfo.get(m) ?? m)582.trim();583}584585const unescapeInfo = new Map<string, string>([586['"', '"'],587[' ', ' '],588['&', '&'],589[''', '\''],590['<', '<'],591['>', '>'],592]);593594function createPlainTextRenderer(): marked.Renderer {595const renderer = new marked.Renderer();596597renderer.code = ({ text }: marked.Tokens.Code): string => {598return escape(text);599};600renderer.blockquote = ({ text }: marked.Tokens.Blockquote): string => {601return text + '\n';602};603renderer.html = (_: marked.Tokens.HTML): string => {604return '';605};606renderer.heading = function ({ tokens }: marked.Tokens.Heading): string {607return this.parser.parseInline(tokens) + '\n';608};609renderer.hr = (): string => {610return '';611};612renderer.list = function ({ items }: marked.Tokens.List): string {613return items.map(x => this.listitem(x)).join('\n') + '\n';614};615renderer.listitem = ({ text }: marked.Tokens.ListItem): string => {616return text + '\n';617};618renderer.paragraph = function ({ tokens }: marked.Tokens.Paragraph): string {619return this.parser.parseInline(tokens) + '\n';620};621renderer.table = function ({ header, rows }: marked.Tokens.Table): string {622return header.map(cell => this.tablecell(cell)).join(' ') + '\n' + rows.map(cells => cells.map(cell => this.tablecell(cell)).join(' ')).join('\n') + '\n';623};624renderer.tablerow = ({ text }: marked.Tokens.TableRow): string => {625return text;626};627renderer.tablecell = function ({ tokens }: marked.Tokens.TableCell): string {628return this.parser.parseInline(tokens);629};630renderer.strong = ({ text }: marked.Tokens.Strong): string => {631return text;632};633renderer.em = ({ text }: marked.Tokens.Em): string => {634return text;635};636renderer.codespan = ({ text }: marked.Tokens.Codespan): string => {637return escape(text);638};639renderer.br = (_: marked.Tokens.Br): string => {640return '\n';641};642renderer.del = ({ text }: marked.Tokens.Del): string => {643return text;644};645renderer.image = (_: marked.Tokens.Image): string => {646return '';647};648renderer.text = ({ text }: marked.Tokens.Text): string => {649return text;650};651renderer.link = ({ text }: marked.Tokens.Link): string => {652return text;653};654return renderer;655}656const plainTextRenderer = new Lazy<marked.Renderer>(createPlainTextRenderer);657658const plainTextWithCodeBlocksRenderer = new Lazy<marked.Renderer>(() => {659const renderer = createPlainTextRenderer();660renderer.code = ({ text }: marked.Tokens.Code): string => {661return `\n\`\`\`\n${escape(text)}\n\`\`\`\n`;662};663return renderer;664});665666function mergeRawTokenText(tokens: marked.Token[]): string {667let mergedTokenText = '';668tokens.forEach(token => {669mergedTokenText += token.raw;670});671return mergedTokenText;672}673674function completeSingleLinePattern(token: marked.Tokens.Text | marked.Tokens.Paragraph): marked.Token | undefined {675if (!token.tokens) {676return undefined;677}678679for (let i = token.tokens.length - 1; i >= 0; i--) {680const subtoken = token.tokens[i];681if (subtoken.type === 'text') {682const lines = subtoken.raw.split('\n');683const lastLine = lines[lines.length - 1];684if (lastLine.includes('`')) {685return completeCodespan(token);686}687688else if (lastLine.includes('**')) {689return completeDoublestar(token);690}691692else if (lastLine.match(/\*\w/)) {693return completeStar(token);694}695696else if (lastLine.match(/(^|\s)__\w/)) {697return completeDoubleUnderscore(token);698}699700else if (lastLine.match(/(^|\s)_\w/)) {701return completeUnderscore(token);702}703704else if (705// Text with start of link target706hasLinkTextAndStartOfLinkTarget(lastLine) ||707// This token doesn't have the link text, eg if it contains other markdown constructs that are in other subtokens.708// But some preceding token does have an unbalanced [ at least709hasStartOfLinkTargetAndNoLinkText(lastLine) && token.tokens.slice(0, i).some(t => t.type === 'text' && t.raw.match(/\[[^\]]*$/))710) {711const nextTwoSubTokens = token.tokens.slice(i + 1);712713// A markdown link can look like714// [link text](https://microsoft.com "more text")715// Where "more text" is a title for the link or an argument to a vscode command link716if (717// If the link was parsed as a link, then look for a link token and a text token with a quote718nextTwoSubTokens[0]?.type === 'link' && nextTwoSubTokens[1]?.type === 'text' && nextTwoSubTokens[1].raw.match(/^ *"[^"]*$/) ||719// And if the link was not parsed as a link (eg command link), just look for a single quote in this token720lastLine.match(/^[^"]* +"[^"]*$/)721) {722723return completeLinkTargetArg(token);724}725return completeLinkTarget(token);726}727728// Contains the start of link text, and no following tokens contain the link target729else if (lastLine.match(/(^|\s)\[\w*[^\]]*$/)) {730return completeLinkText(token);731}732}733}734735return undefined;736}737738function hasLinkTextAndStartOfLinkTarget(str: string): boolean {739return !!str.match(/(^|\s)\[.*\]\(\w*/);740}741742function hasStartOfLinkTargetAndNoLinkText(str: string): boolean {743return !!str.match(/^[^\[]*\]\([^\)]*$/);744}745746function completeListItemPattern(list: marked.Tokens.List): marked.Tokens.List | undefined {747// Patch up this one list item748const lastListItem = list.items[list.items.length - 1];749const lastListSubToken = lastListItem.tokens ? lastListItem.tokens[lastListItem.tokens.length - 1] : undefined;750751/*752Example list token structures:753754list755list_item756text757text758codespan759link760list_item761text762code // Complete indented codeblock763list_item764text765space766text767text // Incomplete indented codeblock768list_item769text770list // Nested list771list_item772text773text774775Contrast with paragraph:776paragraph777text778codespan779*/780781const listEndsInHeading = (list: marked.Tokens.List): boolean => {782// A list item can be rendered as a heading for some reason when it has a subitem where we haven't rendered the text yet like this:783// 1. list item784// -785const lastItem = list.items.at(-1);786const lastToken = lastItem?.tokens.at(-1);787return lastToken?.type === 'heading' || lastToken?.type === 'list' && listEndsInHeading(lastToken as marked.Tokens.List);788};789790let newToken: marked.Token | undefined;791if (lastListSubToken?.type === 'text' && !('inRawBlock' in lastListItem)) { // Why does Tag have a type of 'text'792newToken = completeSingleLinePattern(lastListSubToken as marked.Tokens.Text);793} else if (listEndsInHeading(list)) {794const newList = marked.lexer(list.raw.trim() + ' ')[0] as marked.Tokens.List;795if (newList.type !== 'list') {796// Something went wrong797return;798}799return newList;800}801802if (!newToken || newToken.type !== 'paragraph') { // 'text' item inside the list item turns into paragraph803// Nothing to fix, or not a pattern we were expecting804return;805}806807const previousListItemsText = mergeRawTokenText(list.items.slice(0, -1));808809// Grabbing the `- ` or `1. ` or `* ` off the list item because I can't find a better way to do this810const lastListItemLead = lastListItem.raw.match(/^(\s*(-|\d+\.|\*) +)/)?.[0];811if (!lastListItemLead) {812// Is badly formatted813return;814}815816const newListItemText = lastListItemLead +817mergeRawTokenText(lastListItem.tokens.slice(0, -1)) +818newToken.raw;819820const newList = marked.lexer(previousListItemsText + newListItemText)[0] as marked.Tokens.List;821if (newList.type !== 'list') {822// Something went wrong823return;824}825826return newList;827}828829function completeHeading(token: marked.Tokens.Heading, fullRawText: string): marked.TokensList | void {830if (token.raw.match(/-\s*$/)) {831return marked.lexer(fullRawText + ' ');832}833}834835const maxIncompleteTokensFixRounds = 3;836export function fillInIncompleteTokens(tokens: marked.TokensList): marked.TokensList {837for (let i = 0; i < maxIncompleteTokensFixRounds; i++) {838const newTokens = fillInIncompleteTokensOnce(tokens);839if (newTokens) {840tokens = newTokens;841} else {842break;843}844}845846return tokens;847}848849function fillInIncompleteTokensOnce(tokens: marked.TokensList): marked.TokensList | null {850let i: number;851let newTokens: marked.Token[] | undefined;852for (i = 0; i < tokens.length; i++) {853const token = tokens[i];854855if (token.type === 'paragraph' && token.raw.match(/(\n|^)\|/)) {856newTokens = completeTable(tokens.slice(i));857break;858}859}860861const lastToken = tokens.at(-1);862if (!newTokens && lastToken?.type === 'list') {863const newListToken = completeListItemPattern(lastToken as marked.Tokens.List);864if (newListToken) {865newTokens = [newListToken];866i = tokens.length - 1;867}868}869870if (!newTokens && lastToken?.type === 'paragraph') {871// Only operates on a single token, because any newline that follows this should break these patterns872const newToken = completeSingleLinePattern(lastToken as marked.Tokens.Paragraph);873if (newToken) {874newTokens = [newToken];875i = tokens.length - 1;876}877}878879if (newTokens) {880const newTokensList = [881...tokens.slice(0, i),882...newTokens883];884(newTokensList as marked.TokensList).links = tokens.links;885return newTokensList as marked.TokensList;886}887888if (lastToken?.type === 'heading') {889const completeTokens = completeHeading(lastToken as marked.Tokens.Heading, mergeRawTokenText(tokens));890if (completeTokens) {891return completeTokens;892}893}894895return null;896}897898899function completeCodespan(token: marked.Token): marked.Token {900return completeWithString(token, '`');901}902903function completeStar(tokens: marked.Token): marked.Token {904return completeWithString(tokens, '*');905}906907function completeUnderscore(tokens: marked.Token): marked.Token {908return completeWithString(tokens, '_');909}910911function completeLinkTarget(tokens: marked.Token): marked.Token {912return completeWithString(tokens, ')', false);913}914915function completeLinkTargetArg(tokens: marked.Token): marked.Token {916return completeWithString(tokens, '")', false);917}918919function completeLinkText(tokens: marked.Token): marked.Token {920return completeWithString(tokens, '](https://microsoft.com)', false);921}922923function completeDoublestar(tokens: marked.Token): marked.Token {924return completeWithString(tokens, '**');925}926927function completeDoubleUnderscore(tokens: marked.Token): marked.Token {928return completeWithString(tokens, '__');929}930931function completeWithString(tokens: marked.Token[] | marked.Token, closingString: string, shouldTrim = true): marked.Token {932const mergedRawText = mergeRawTokenText(Array.isArray(tokens) ? tokens : [tokens]);933934// If it was completed correctly, this should be a single token.935// Expecting either a Paragraph or a List936const trimmedRawText = shouldTrim ? mergedRawText.trimEnd() : mergedRawText;937return marked.lexer(trimmedRawText + closingString)[0] as marked.Token;938}939940function completeTable(tokens: marked.Token[]): marked.Token[] | undefined {941const mergedRawText = mergeRawTokenText(tokens);942const lines = mergedRawText.split('\n');943944let numCols: number | undefined; // The number of line1 col headers945let hasSeparatorRow = false;946for (let i = 0; i < lines.length; i++) {947const line = lines[i].trim();948if (typeof numCols === 'undefined' && line.match(/^\s*\|/)) {949const line1Matches = line.match(/(\|[^\|]+)(?=\||$)/g);950if (line1Matches) {951numCols = line1Matches.length;952}953} else if (typeof numCols === 'number') {954if (line.match(/^\s*\|/)) {955if (i !== lines.length - 1) {956// We got the line1 header row, and the line2 separator row, but there are more lines, and it wasn't parsed as a table!957// That's strange and means that the table is probably malformed in the source, so I won't try to patch it up.958return undefined;959}960961// Got a line2 separator row- partial or complete, doesn't matter, we'll replace it with a correct one962hasSeparatorRow = true;963} else {964// The line after the header row isn't a valid separator row, so the table is malformed, don't fix it up965return undefined;966}967}968}969970if (typeof numCols === 'number' && numCols > 0) {971const prefixText = hasSeparatorRow ? lines.slice(0, -1).join('\n') : mergedRawText;972const line1EndsInPipe = !!prefixText.match(/\|\s*$/);973const newRawText = prefixText + (line1EndsInPipe ? '' : '|') + `\n|${' --- |'.repeat(numCols)}`;974return marked.lexer(newRawText);975}976977return undefined;978}979980981982