silverbullet/plug-api/lib/frontmatter.ts

198 lines
5.7 KiB
TypeScript
Raw Permalink Normal View History

2022-11-24 19:04:00 +08:00
import {
addParentPointers,
2024-07-30 23:33:33 +08:00
type ParseTree,
2022-11-24 19:04:00 +08:00
renderToText,
replaceNodesMatchingAsync,
traverseTreeAsync,
2024-02-29 22:23:05 +08:00
} from "./tree.ts";
2024-07-06 21:07:40 +08:00
import { cleanupJSON } from "./json.ts";
import { YAML } from "../syscalls.ts";
import { extractHashtag } from "./tags.ts";
2022-11-24 19:04:00 +08:00
export type FrontMatter = { tags?: string[] } & Record<string, any>;
2023-11-06 16:14:16 +08:00
export type FrontmatterExtractOptions = {
removeKeys?: string[];
removeTags?: string[] | true;
removeFrontmatterSection?: boolean;
};
/**
* Extracts front matter from a markdown document, as well as extracting tags that are to apply to the page
* optionally removes certain keys from the front matter
* Side effect: will add parent pointers
*/
export async function extractFrontmatter(
2022-11-24 19:04:00 +08:00
tree: ParseTree,
options: FrontmatterExtractOptions = {},
2023-11-06 16:14:16 +08:00
): Promise<FrontMatter> {
let data: FrontMatter = {
tags: [],
};
const tags: string[] = [];
2022-11-24 19:04:00 +08:00
addParentPointers(tree);
await replaceNodesMatchingAsync(tree, async (t) => {
// Find tags in paragraphs directly nested under the document where the only content is tags
if (t.type === "Paragraph" && t.parent?.type === "Document") {
let onlyTags = true;
const collectedTags = new Set<string>();
for (const child of t.children!) {
if (child.text) {
if (child.text.startsWith("\n") && child.text !== "\n") {
// Multi line paragraph, cut it off here
break;
}
if (child.text.trim()) {
// Text node with actual text (not just whitespace): not a page tag line!
onlyTags = false;
break;
}
} else if (child.type === "Hashtag") {
const tagname = extractHashtag(child.children![0].text!);
collectedTags.add(tagname);
if (
options.removeTags === true || options.removeTags?.includes(tagname)
) {
// Ugly hack to remove the hashtag
child.children![0].text = "";
}
} else if (child.type) {
// Found something else than tags, so... nope!
onlyTags = false;
break;
}
}
if (onlyTags) {
tags.push(...collectedTags);
}
2022-11-24 19:04:00 +08:00
}
// Find FrontMatter and parse it
if (t.type === "FrontMatter") {
2022-11-24 23:08:51 +08:00
const yamlNode = t.children![1].children![0];
const yamlText = renderToText(yamlNode);
2022-11-24 19:04:00 +08:00
try {
const parsedData: any = await YAML.parse(yamlText);
// console.log("Parsed front matter", parsedData);
2022-11-24 19:04:00 +08:00
const newData = { ...parsedData };
data = { ...data, ...parsedData };
2023-11-06 16:14:16 +08:00
// Make sure we have a tags array
if (!data.tags) {
data.tags = [];
}
// Normalize tags to an array
// support "tag1, tag2" as well as "tag1 tag2" as well as "#tag1 #tag2" notations
2023-11-06 16:14:16 +08:00
if (typeof data.tags === "string") {
tags.push(...(data.tags as string).split(/,\s*|\s+/));
2023-11-06 16:14:16 +08:00
}
if (Array.isArray(data.tags)) {
tags.push(...data.tags);
}
if (options.removeKeys && options.removeKeys.length > 0) {
2022-11-24 19:04:00 +08:00
let removedOne = false;
for (const key of options.removeKeys) {
2022-11-24 19:04:00 +08:00
if (key in newData) {
delete newData[key];
removedOne = true;
}
}
if (removedOne) {
yamlNode.text = await YAML.stringify(newData);
2022-11-24 19:04:00 +08:00
}
}
// If nothing is left, let's just delete this whole block
if (
Object.keys(newData).length === 0 || options.removeFrontmatterSection
) {
2022-11-24 19:04:00 +08:00
return null;
}
} catch {
// console.warn("Could not parse frontmatter", e.message);
2022-11-24 19:04:00 +08:00
}
}
return undefined;
});
try {
data.tags = [
...new Set([...tags.map((t) => {
// Always treat tags as strings
const tagAsString = String(t);
// Strip # from tags
return tagAsString.replace(/^#/, "");
})]),
];
} catch (e) {
console.error("Error while processing tags", e);
}
// console.log("Extracted tags", data.tags);
// Expand property names (e.g. "foo.bar" => { foo: { bar: true } })
2024-07-06 21:07:40 +08:00
data = cleanupJSON(data);
2022-11-24 19:04:00 +08:00
return data;
}
2024-08-07 19:27:25 +08:00
/**
* Updates the front matter of a markdown document and returns the text as a rendered string
*/
export async function prepareFrontmatterDispatch(
2022-11-24 19:04:00 +08:00
tree: ParseTree,
2023-11-13 22:49:21 +08:00
data: string | Record<string, any>,
): Promise<any> {
2022-11-24 19:04:00 +08:00
let dispatchData: any = null;
await traverseTreeAsync(tree, async (t) => {
2022-11-24 19:04:00 +08:00
// Find FrontMatter and parse it
if (t.type === "FrontMatter") {
const bodyNode = t.children![1].children![0];
const yamlText = renderToText(bodyNode);
try {
2023-11-13 22:49:21 +08:00
let frontmatterText = "";
if (typeof data === "string") {
frontmatterText = yamlText + data + "\n";
} else {
const parsedYaml = await YAML.parse(yamlText) as any;
const newData = { ...parsedYaml, ...data };
frontmatterText = await YAML.stringify(newData);
}
2022-11-24 19:04:00 +08:00
// Patch inline
dispatchData = {
changes: {
from: bodyNode.from,
to: bodyNode.to,
2023-11-13 22:49:21 +08:00
insert: frontmatterText,
2022-11-24 19:04:00 +08:00
},
};
} catch (e: any) {
console.error("Error parsing YAML", e);
}
return true;
}
return false;
});
if (!dispatchData) {
// If we didn't find frontmatter, let's add it
2023-11-13 22:49:21 +08:00
let frontmatterText = "";
if (typeof data === "string") {
frontmatterText = data + "\n";
} else {
frontmatterText = await YAML.stringify(data);
}
const fullFrontmatterText = "---\n" + frontmatterText +
"---\n";
2022-11-24 19:04:00 +08:00
dispatchData = {
changes: {
from: 0,
to: 0,
2023-11-13 22:49:21 +08:00
insert: fullFrontmatterText,
2022-11-24 19:04:00 +08:00
},
};
}
return dispatchData;
}