2022-11-24 19:04:00 +08:00
|
|
|
import {
|
|
|
|
addParentPointers,
|
2024-07-30 23:33:33 +08:00
|
|
|
type ParseTree,
|
2022-11-24 19:04:00 +08:00
|
|
|
renderToText,
|
2023-05-24 02:53:53 +08:00
|
|
|
replaceNodesMatchingAsync,
|
|
|
|
traverseTreeAsync,
|
2024-02-29 22:23:05 +08:00
|
|
|
} from "./tree.ts";
|
2024-07-06 21:07:40 +08:00
|
|
|
import { cleanupJSON } from "./json.ts";
|
2024-03-16 22:29:24 +08:00
|
|
|
import { YAML } from "../syscalls.ts";
|
2024-10-20 18:39:58 +08:00
|
|
|
import { extractHashtag } from "./tags.ts";
|
2022-11-24 19:04:00 +08:00
|
|
|
|
2024-01-11 20:20:50 +08:00
|
|
|
/**
 * Data extracted from a page's front matter: arbitrary keys, plus an optional
 * `tags` list.
 */
export type FrontMatter = Record<string, any> & { tags?: string[] };
|
2023-11-06 16:14:16 +08:00
|
|
|
|
2023-11-09 16:26:44 +08:00
|
|
|
/**
 * Controls what `extractFrontmatter` strips from the parse tree while it
 * extracts data. Every option is optional; by default nothing is removed
 * unless the front matter turns out to have no keys at all.
 */
export type FrontmatterExtractOptions = {
  /** Keys to delete from the front matter YAML that is written back into the tree. */
  removeKeys?: string[];
  /**
   * Hashtags to blank out in paragraphs directly under the document:
   * `true` for every hashtag, or a list of tag names to match.
   */
  removeTags?: string[] | true;
  /** When set, the front matter node is dropped from the tree after parsing. */
  removeFrontmatterSection?: boolean;
};
|
|
|
|
|
2024-01-11 20:20:50 +08:00
|
|
|
/**
 * True when a parsed YAML value is a key/value mapping, i.e. a non-null object
 * that is not an array.
 */
function isYamlMapping(value: unknown): value is Record<string, any> {
  return typeof value === "object" && value !== null && !Array.isArray(value);
}

/**
 * Turns raw tag values into a de-duplicated list of tag names: values are
 * stringified, one leading "#" is stripped, and null/undefined entries as well
 * as empty names are dropped. First-seen order is kept.
 */
function normalizePageTags(rawTags: readonly unknown[]): string[] {
  const unique = new Set<string>();
  for (const raw of rawTags) {
    if (raw === null || raw === undefined) {
      continue;
    }
    // Always treat tags as strings, and strip # from tags
    const name = String(raw).replace(/^#/, "");
    if (name) {
      unique.add(name);
    }
  }
  return [...unique];
}

/**
 * Extracts front matter from a markdown document, together with the tags that
 * apply to the page as a whole.
 *
 * Page tags come from two places:
 * - hashtags in paragraphs that sit directly under the document node and
 *   contain nothing but hashtags and whitespace, and
 * - the `tags` key of the YAML front matter, given either as a list or as a
 *   single string such as "tag1, tag2", "tag1 tag2" or "#tag1 #tag2".
 *
 * Front matter that cannot be parsed, or that parses to something other than
 * a key/value mapping, is ignored and left in the tree untouched.
 *
 * Side effects on `tree`: parent pointers are added, and depending on
 * `options` hashtag text is blanked, keys are removed from the front matter
 * YAML, or the front matter node is dropped.
 *
 * @param tree parsed markdown document; mutated in place
 * @param options controls what gets stripped from `tree` while extracting
 * @returns the front matter data after `cleanupJSON`, with `tags` set to the
 * de-duplicated page tags (no leading "#")
 */
export async function extractFrontmatter(
  tree: ParseTree,
  options: FrontmatterExtractOptions = {},
): Promise<FrontMatter> {
  let data: FrontMatter = {
    tags: [],
  };
  // Raw tag values from paragraphs and front matter; normalized at the end
  const tags: unknown[] = [];
  addParentPointers(tree);

  await replaceNodesMatchingAsync(tree, async (t) => {
    // Find tags in paragraphs directly nested under the document where the only content is tags
    if (t.type === "Paragraph" && t.parent?.type === "Document") {
      let onlyTags = true;
      const collectedTags = new Set<string>();
      for (const child of t.children!) {
        if (child.text) {
          if (child.text.startsWith("\n") && child.text !== "\n") {
            // Multi line paragraph, cut it off here
            break;
          }
          if (child.text.trim()) {
            // Text node with actual text (not just whitespace): not a page tag line!
            onlyTags = false;
            break;
          }
        } else if (child.type === "Hashtag") {
          const tagname = extractHashtag(child.children![0].text!);
          collectedTags.add(tagname);

          // NOTE(review): the hashtag is blanked before we know whether the
          // paragraph is tag-only, so "#tag some text" loses its hashtag even
          // though it is not counted as a page tag. Confirm this is intended.
          if (
            options.removeTags === true || options.removeTags?.includes(tagname)
          ) {
            // Ugly hack to remove the hashtag
            child.children![0].text = "";
          }
        } else if (child.type) {
          // Found something else than tags, so... nope!
          onlyTags = false;
          break;
        }
      }
      if (onlyTags) {
        tags.push(...collectedTags);
      }
    }

    // Find FrontMatter and parse it
    if (t.type === "FrontMatter") {
      const yamlNode = t.children?.[1]?.children?.[0];
      if (!yamlNode) {
        // No YAML body under this node: nothing to parse or rewrite
        return undefined;
      }
      const yamlText = renderToText(yamlNode);
      try {
        const rawYaml: unknown = await YAML.parse(yamlText);
        let parsedData: Record<string, any>;
        if (rawYaml === null || rawYaml === undefined) {
          // Empty document: treat as a mapping without keys
          parsedData = {};
        } else if (isYamlMapping(rawYaml)) {
          parsedData = rawYaml;
        } else {
          // A scalar or list is not front matter data. Spreading it would add
          // index keys ("0", "1", ...) to the result, so leave it alone just
          // like YAML that fails to parse.
          return undefined;
        }

        // newData is what gets written back into the tree; data is what is returned
        const newData = { ...parsedData };
        data = { ...data, ...parsedData };
        // Make sure we have a tags array
        if (!data.tags) {
          data.tags = [];
        }
        // Normalize tags to an array
        // support "tag1, tag2" as well as "tag1 tag2" as well as "#tag1 #tag2" notations
        if (typeof data.tags === "string") {
          tags.push(...(data.tags as string).split(/,\s*|\s+/));
        }
        if (Array.isArray(data.tags)) {
          tags.push(...data.tags);
        }

        if (options.removeKeys && options.removeKeys.length > 0) {
          let removedOne = false;

          for (const key of options.removeKeys) {
            if (key in newData) {
              delete newData[key];
              removedOne = true;
            }
          }
          if (removedOne) {
            // Only re-serialize when something changed, to keep the original text otherwise
            yamlNode.text = await YAML.stringify(newData);
          }
        }
        // If nothing is left, let's just delete this whole block
        if (
          Object.keys(newData).length === 0 || options.removeFrontmatterSection
        ) {
          return null;
        }
      } catch {
        // Deliberately silent: unparseable front matter is ignored
        // console.warn("Could not parse frontmatter", e.message);
      }
    }

    return undefined;
  });

  try {
    data.tags = normalizePageTags(tags);
  } catch (e) {
    console.error("Error while processing tags", e);
  }

  // Expand property names (e.g. "foo.bar" => { foo: { bar: true } })
  data = cleanupJSON(data);

  return data;
}
|
|
|
|
|
2024-08-07 19:27:25 +08:00
|
|
|
/**
 * Describes the text change needed to write `data` into a document's front
 * matter. Nothing is applied here; the change is only built and returned.
 *
 * - When `tree` contains a FrontMatter node, the change replaces the body of
 *   that block. String `data` is appended to the existing YAML text followed
 *   by a newline; object `data` is merged over the parsed YAML (keys in
 *   `data` win) and the result is re-serialized.
 * - When no change was built from an existing block, the change inserts a new
 *   `---` delimited block at offset 0.
 *
 * @param tree parsed markdown document
 * @param data raw YAML text to append, or key/value pairs to merge
 * @returns an object of the shape `{ changes: { from, to, insert } }`
 */
export async function prepareFrontmatterDispatch(
  tree: ParseTree,
  data: string | Record<string, any>,
): Promise<any> {
  let dispatchData: any = null;

  await traverseTreeAsync(tree, async (t) => {
    if (t.type !== "FrontMatter") {
      return false;
    }

    // Found the front matter: build a change that patches its body inline
    const bodyNode = t.children![1].children![0];
    const yamlText = renderToText(bodyNode);

    try {
      let frontmatterText = "";
      if (typeof data === "string") {
        frontmatterText = yamlText + data + "\n";
      } else {
        const parsedYaml = await YAML.parse(yamlText) as any;
        const newData = { ...parsedYaml, ...data };
        frontmatterText = await YAML.stringify(newData);
      }
      dispatchData = {
        changes: {
          from: bodyNode.from,
          to: bodyNode.to,
          insert: frontmatterText,
        },
      };
    } catch (e: any) {
      console.error("Error parsing YAML", e);
    }
    return true;
  });

  if (!dispatchData) {
    // If we didn't find frontmatter, let's add it
    // NOTE(review): this branch is also taken when a front matter block exists
    // but the try block above threw, in which case a second block is
    // prepended in front of the existing one. Confirm that this is intended.
    let frontmatterText = "";
    if (typeof data === "string") {
      frontmatterText = data + "\n";
    } else {
      frontmatterText = await YAML.stringify(data);
    }
    const fullFrontmatterText = "---\n" + frontmatterText +
      "---\n";
    dispatchData = {
      changes: {
        from: 0,
        to: 0,
        insert: fullFrontmatterText,
      },
    };
  }

  return dispatchData;
}
|