silverbullet/plugs/markdown/markdown_render.ts

530 lines
13 KiB
TypeScript
Raw Normal View History

import {
2023-10-29 19:10:30 +08:00
addParentPointers,
collectNodesOfType,
findNodeOfType,
ParseTree,
2023-11-28 17:06:53 +08:00
removeParentPointers,
renderToText,
traverseTree,
2024-02-29 22:23:05 +08:00
} from "../../plug-api/lib/tree.ts";
import { encodePageRef, parsePageRef } from "$sb/lib/page_ref.ts";
import { Fragment, renderHtml, Tag } from "./html_render.ts";
2023-11-02 19:35:30 +08:00
export type MarkdownRenderOptions = {
failOnUnknown?: true;
smartHardBreak?: true;
annotationPositions?: true;
attachmentUrlPrefix?: string;
2023-07-25 01:54:31 +08:00
preserveAttributes?: true;
2023-02-23 22:33:51 +08:00
// When defined, use to inline images as data: urls
2023-12-20 00:20:47 +08:00
translateUrls?: (url: string, type: "link" | "image") => string;
};
2023-10-29 19:10:30 +08:00
function cleanTags(values: (Tag | null)[], cleanWhitespace = false): Tag[] {
const result: Tag[] = [];
for (const value of values) {
2023-10-29 19:10:30 +08:00
if (cleanWhitespace && typeof value === "string" && value.match(/^\s+$/)) {
continue;
}
if (value) {
result.push(value);
}
}
return result;
}
function preprocess(t: ParseTree) {
2023-10-29 19:10:30 +08:00
addParentPointers(t);
traverseTree(t, (node) => {
2023-10-29 19:10:30 +08:00
if (!node.type) {
if (node.text?.startsWith("\n")) {
const prevNodeIdx = node.parent!.children!.indexOf(node) - 1;
2024-03-02 20:09:05 +08:00
const prevNodeType = node.parent!.children![prevNodeIdx]?.type;
2024-03-10 19:28:13 +08:00
if (
prevNodeType?.includes("Heading") || prevNodeType?.includes("Table")
) {
2023-10-29 19:10:30 +08:00
node.text = node.text.slice(1);
}
}
}
return false;
});
}
function posPreservingRender(
t: ParseTree,
options: MarkdownRenderOptions = {},
): Tag | null {
const tag = render(t, options);
if (!options.annotationPositions) {
return tag;
}
if (!tag) {
return null;
}
if (typeof tag === "string") {
return tag;
}
if (t.from) {
if (!tag.attrs) {
tag.attrs = {};
}
tag.attrs["data-pos"] = "" + t.from;
}
return tag;
}
function render(
t: ParseTree,
options: MarkdownRenderOptions = {},
): Tag | null {
if (t.type?.endsWith("Mark") || t.type?.endsWith("Delimiter")) {
return null;
}
switch (t.type) {
case "Document":
return {
name: Fragment,
body: cleanTags(mapRender(t.children!)),
};
case "FrontMatter":
return null;
case "CommentBlock":
// Remove, for now
return null;
case "ATXHeading1":
return {
name: "h1",
body: cleanTags(mapRender(t.children!)),
};
case "ATXHeading2":
return {
name: "h2",
body: cleanTags(mapRender(t.children!)),
};
case "ATXHeading3":
return {
name: "h3",
body: cleanTags(mapRender(t.children!)),
};
case "ATXHeading4":
return {
name: "h4",
body: cleanTags(mapRender(t.children!)),
};
case "ATXHeading5":
return {
name: "h5",
body: cleanTags(mapRender(t.children!)),
};
case "Paragraph":
return {
2023-10-29 19:10:30 +08:00
name: "span",
attrs: {
class: "p",
},
body: cleanTags(mapRender(t.children!)),
};
// Code blocks
case "FencedCode":
case "CodeBlock": {
// Clear out top-level indent blocks
const lang = findNodeOfType(t, "CodeInfo");
t.children = t.children!.filter((c) => c.type);
return {
name: "pre",
attrs: {
"data-lang": lang ? lang.children![0].text : undefined,
},
body: cleanTags(mapRender(t.children!)),
};
}
case "CodeInfo":
return null;
case "CodeText":
return t.children![0].text!;
case "Blockquote":
return {
name: "blockquote",
body: cleanTags(mapRender(t.children!)),
};
case "HardBreak":
return {
name: "br",
body: "",
};
// Basic styling
case "Emphasis":
return {
name: "em",
body: cleanTags(mapRender(t.children!)),
};
case "Highlight":
return {
name: "span",
attrs: {
class: "highlight",
},
body: cleanTags(mapRender(t.children!)),
};
case "Strikethrough":
return {
name: "del",
body: cleanTags(mapRender(t.children!)),
};
case "InlineCode":
return {
name: "tt",
body: cleanTags(mapRender(t.children!)),
};
case "BulletList":
return {
name: "ul",
2023-10-29 19:10:30 +08:00
body: cleanTags(mapRender(t.children!), true),
};
case "OrderedList":
return {
name: "ol",
2023-10-29 19:10:30 +08:00
body: cleanTags(mapRender(t.children!), true),
};
case "ListItem":
return {
name: "li",
2023-10-29 19:10:30 +08:00
body: cleanTags(mapRender(t.children!), true),
};
case "StrongEmphasis":
return {
name: "strong",
body: cleanTags(mapRender(t.children!)),
};
case "HorizontalRule":
return {
name: "hr",
body: "",
};
case "Link": {
const linkTextChildren = t.children!.slice(1, -4);
const urlNode = findNodeOfType(t, "URL");
if (!urlNode) {
return renderToText(t);
}
let url = urlNode.children![0].text!;
if (url.indexOf("://") === -1) {
if (
options.attachmentUrlPrefix &&
!url.startsWith(options.attachmentUrlPrefix)
) {
url = `${options.attachmentUrlPrefix}${url}`;
}
}
return {
name: "a",
attrs: {
href: url,
},
body: cleanTags(mapRender(linkTextChildren)),
};
}
case "Image": {
const altText = t.children![1].text!;
const urlNode = findNodeOfType(t, "URL");
if (!urlNode) {
return renderToText(t);
}
let url = urlNode!.children![0].text!;
if (url.indexOf("://") === -1) {
if (
options.attachmentUrlPrefix &&
!url.startsWith(options.attachmentUrlPrefix)
) {
url = `${options.attachmentUrlPrefix}${url}`;
}
}
return {
name: "img",
attrs: {
src: url,
alt: altText,
},
body: "",
};
}
// Custom stuff
case "WikiLink": {
const ref = findNodeOfType(t, "WikiLinkPage")!.children![0].text!;
2023-08-18 02:37:55 +08:00
let linkText = ref.split("/").pop()!;
2022-11-27 18:20:43 +08:00
const aliasNode = findNodeOfType(t, "WikiLinkAlias");
if (aliasNode) {
linkText = aliasNode.children![0].text!;
}
2024-01-24 21:44:39 +08:00
const pageRef = parsePageRef(ref);
return {
name: "a",
attrs: {
2024-01-24 21:44:39 +08:00
href: `/${encodePageRef(pageRef)}`,
2023-11-12 19:08:09 +08:00
class: "wiki-link",
"data-ref": ref,
},
2022-11-27 18:20:43 +08:00
body: linkText,
};
}
case "NakedURL": {
const url = t.children![0].text!;
return {
name: "a",
attrs: {
href: url,
},
body: url,
};
}
case "Hashtag":
return {
name: "span",
attrs: {
class: "hashtag",
},
body: t.children![0].text!,
};
case "Task": {
let externalTaskRef = "";
collectNodesOfType(t, "WikiLinkPage").forEach((wikilink) => {
const pageRef = parsePageRef(wikilink.children![0].text!);
if (!externalTaskRef && (pageRef.pos !== undefined || pageRef.anchor)) {
externalTaskRef = wikilink.children![0].text!;
}
});
return {
name: "span",
attrs: externalTaskRef
? {
"data-external-task-ref": externalTaskRef,
}
: {},
body: cleanTags(mapRender(t.children!)),
};
}
case "TaskState": {
// child[0] = marker, child[1] = state, child[2] = marker
const stateText = t.children![1].text!;
if ([" ", "x", "X"].includes(stateText)) {
return {
name: "input",
attrs: {
type: "checkbox",
checked: stateText !== " " ? "checked" : undefined,
"data-state": stateText,
},
body: "",
};
} else {
return {
name: "span",
attrs: {
class: "task-state",
},
body: stateText,
};
}
}
case "NamedAnchor":
return {
name: "a",
attrs: {
name: t.children![0].text?.substring(1),
},
body: "",
};
case "ImageWithSize": {
const alt = findNodeOfType(t, "ImageWithSizeAlt")!.children![0].text!;
const src = findNodeOfType(t, "ImageWithSizeURL")!.children![0].text!;
const dimensionsToParse = findNodeOfType(t, "ImageWithSizeSize")!.children![0].text!;
const [, width, widthUnit = "px", height, heightUnit = "px"] =
dimensionsToParse.match(/(\d*)(%)?x(\d*)(%)?/) ?? [];
return {
name: "img",
attrs: {
alt,
src,
style: `width: ${width}${widthUnit}; height: ${height}${heightUnit};`
},
body: "",
};
}
case "CommandLink": {
// Child 0 is CommandLinkMark, child 1 is CommandLinkPage
const command = t.children![1].children![0].text!;
let commandText = command;
const aliasNode = findNodeOfType(t, "CommandLinkAlias");
const argsNode = findNodeOfType(t, "CommandLinkArgs");
let args: any = [];
if (argsNode) {
args = JSON.parse(`[${argsNode.children![0].text!}]`);
}
if (aliasNode) {
commandText = aliasNode.children![0].text!;
}
return {
name: "button",
attrs: {
"data-onclick": JSON.stringify(["command", command, args]),
},
body: commandText,
};
}
case "DeadlineDate":
2023-11-12 19:08:09 +08:00
return {
name: "span",
attrs: {
class: "task-deadline",
},
body: renderToText(t),
};
// Tables
case "Table":
return {
name: "table",
body: cleanTags(mapRender(t.children!)),
};
case "TableHeader":
return {
name: "thead",
body: [
{
name: "tr",
body: cleanTags(mapRender(t.children!)),
},
],
};
case "TableCell":
return {
name: "td",
body: cleanTags(mapRender(t.children!)),
};
2022-11-30 22:59:41 +08:00
case "TableRow": {
const children = t.children!;
const newChildren: ParseTree[] = [];
// Ensure there is TableCell in between every delimiter
let lookingForCell = false;
for (const child of children) {
if (child.type === "TableDelimiter" && lookingForCell) {
// We were looking for a cell, but didn't fine one: empty cell!
// Let's inject an empty one
newChildren.push({
type: "TableCell",
children: [],
});
}
if (child.type === "TableDelimiter") {
lookingForCell = true;
}
if (child.type === "TableCell") {
lookingForCell = false;
}
newChildren.push(child);
}
return {
name: "tr",
2022-11-30 22:59:41 +08:00
body: cleanTags(mapRender(newChildren)),
};
2022-11-30 22:59:41 +08:00
}
2023-07-25 01:54:31 +08:00
case "Attribute":
if (options.preserveAttributes) {
return {
name: "span",
attrs: {
class: "attribute",
},
body: renderToText(t),
};
}
return null;
case "Escape": {
return {
name: "span",
attrs: {
class: "escape",
},
body: t.children![0].text!.slice(1),
};
}
2023-11-28 17:06:53 +08:00
case "Entity":
return t.children![0].text!;
case "TemplateDirective": {
return {
name: "span",
attrs: {
class: "template-directive",
},
body: renderToText(t),
};
}
// Text
case undefined:
return t.text!;
default:
if (options.failOnUnknown) {
2023-11-28 17:06:53 +08:00
removeParentPointers(t);
console.error("Not handling", JSON.stringify(t, null, 2));
throw new Error(`Unknown markdown node type ${t.type}`);
} else {
// Falling back to rendering verbatim
2023-11-28 17:06:53 +08:00
removeParentPointers(t);
console.warn("Not handling", JSON.stringify(t, null, 2));
return renderToText(t);
}
}
function mapRender(children: ParseTree[]) {
return children.map((t) => posPreservingRender(t, options));
}
}
function traverseTag(
2023-02-23 22:33:51 +08:00
t: Tag,
fn: (t: Tag) => void,
) {
fn(t);
2023-02-23 22:33:51 +08:00
if (typeof t === "string") {
return;
}
if (t.body) {
for (const child of t.body) {
traverseTag(child, fn);
2023-02-23 22:33:51 +08:00
}
}
}
export function renderMarkdownToHtml(
t: ParseTree,
options: MarkdownRenderOptions = {},
) {
preprocess(t);
const htmlTree = posPreservingRender(t, options);
if (htmlTree && options.translateUrls) {
traverseTag(htmlTree, (t) => {
2023-02-23 22:33:51 +08:00
if (typeof t === "string") {
return;
}
if (t.name === "img") {
2023-12-20 00:20:47 +08:00
t.attrs!.src = options.translateUrls!(t.attrs!.src!, "image");
}
2023-07-07 17:44:05 +08:00
if (t.name === "a" && t.attrs!.href) {
2023-12-20 00:20:47 +08:00
t.attrs!.href = options.translateUrls!(t.attrs!.href, "link");
2023-02-23 22:33:51 +08:00
}
});
}
return renderHtml(htmlTree);
}