2023-01-17 01:55:35 +08:00
|
|
|
import { renderToText, replaceNodesMatching } from "../../plug-api/lib/tree.ts";
|
|
|
|
import buildMarkdown from "../markdown_parser/parser.ts";
|
|
|
|
import { parse } from "../markdown_parser/parse_tree.ts";
|
2023-01-13 22:41:29 +08:00
|
|
|
import type { FileMeta } from "../types.ts";
|
|
|
|
import { SpacePrimitives } from "./space_primitives.ts";
|
|
|
|
|
|
|
|
type SyncHash = number;
|
|
|
|
|
|
|
|
// Tuple where the first value represents a lastModified timestamp for the primary space
|
|
|
|
// and the second item the lastModified value of the secondary space
|
|
|
|
export type SyncStatusItem = [SyncHash, SyncHash];
|
|
|
|
|
2023-01-15 01:51:00 +08:00
|
|
|
export interface Logger {
|
|
|
|
log(level: string, ...messageBits: any[]): void;
|
|
|
|
}
|
|
|
|
|
|
|
|
class ConsoleLogger implements Logger {
|
|
|
|
log(_level: string, ...messageBits: any[]) {
|
|
|
|
console.log(...messageBits);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-02-28 18:13:18 +08:00
|
|
|
export type SyncOptions = {
|
|
|
|
logger?: Logger;
|
|
|
|
excludePrefixes?: string[];
|
|
|
|
};
|
|
|
|
|
2023-01-13 22:41:29 +08:00
|
|
|
// Implementation of this algorithm https://unterwaditzer.net/2016/sync-algorithm.html
|
|
|
|
export class SpaceSync {
|
2023-02-28 18:13:18 +08:00
|
|
|
logger: ConsoleLogger;
|
|
|
|
excludePrefixes: string[];
|
|
|
|
|
2023-01-13 22:41:29 +08:00
|
|
|
constructor(
|
|
|
|
private primary: SpacePrimitives,
|
|
|
|
private secondary: SpacePrimitives,
|
|
|
|
readonly snapshot: Map<string, SyncStatusItem>,
|
2023-02-28 18:13:18 +08:00
|
|
|
readonly options: SyncOptions,
|
|
|
|
) {
|
|
|
|
this.logger = options.logger || new ConsoleLogger();
|
|
|
|
this.excludePrefixes = options.excludePrefixes || [];
|
|
|
|
}
|
2023-01-13 22:41:29 +08:00
|
|
|
|
|
|
|
async syncFiles(
|
2023-01-20 23:08:01 +08:00
|
|
|
conflictResolver: (
|
2023-01-13 22:41:29 +08:00
|
|
|
name: string,
|
|
|
|
snapshot: Map<string, SyncStatusItem>,
|
|
|
|
primarySpace: SpacePrimitives,
|
|
|
|
secondarySpace: SpacePrimitives,
|
2023-01-15 01:51:00 +08:00
|
|
|
logger: Logger,
|
2023-01-17 01:55:35 +08:00
|
|
|
) => Promise<number>,
|
2023-01-13 22:41:29 +08:00
|
|
|
): Promise<number> {
|
|
|
|
let operations = 0;
|
2023-01-15 01:51:00 +08:00
|
|
|
this.logger.log("info", "Fetching snapshot from primary");
|
2023-01-13 22:41:29 +08:00
|
|
|
const primaryAllPages = this.syncCandidates(
|
|
|
|
await this.primary.fetchFileList(),
|
|
|
|
);
|
|
|
|
|
2023-01-15 01:51:00 +08:00
|
|
|
this.logger.log("info", "Fetching snapshot from secondary");
|
2023-01-13 22:41:29 +08:00
|
|
|
try {
|
|
|
|
const secondaryAllPages = this.syncCandidates(
|
|
|
|
await this.secondary.fetchFileList(),
|
|
|
|
);
|
|
|
|
|
|
|
|
const primaryFileMap = new Map<string, SyncHash>(
|
|
|
|
primaryAllPages.map((m) => [m.name, m.lastModified]),
|
|
|
|
);
|
|
|
|
const secondaryFileMap = new Map<string, SyncHash>(
|
|
|
|
secondaryAllPages.map((m) => [m.name, m.lastModified]),
|
|
|
|
);
|
|
|
|
|
|
|
|
const allFilesToProcess = new Set([
|
|
|
|
...this.snapshot.keys(),
|
|
|
|
...primaryFileMap.keys(),
|
|
|
|
...secondaryFileMap.keys(),
|
|
|
|
]);
|
|
|
|
|
2023-01-15 01:51:00 +08:00
|
|
|
this.logger.log("info", "Iterating over all files");
|
2023-01-13 22:41:29 +08:00
|
|
|
for (const name of allFilesToProcess) {
|
2023-01-25 16:46:56 +08:00
|
|
|
try {
|
|
|
|
operations += await this.syncFile(
|
|
|
|
name,
|
|
|
|
primaryFileMap.get(name),
|
|
|
|
secondaryFileMap.get(name),
|
|
|
|
conflictResolver,
|
|
|
|
);
|
|
|
|
} catch (e: any) {
|
|
|
|
this.logger.log("error", "Error syncing file", name, e.message);
|
|
|
|
}
|
2023-01-13 22:41:29 +08:00
|
|
|
}
|
|
|
|
} catch (e: any) {
|
2023-01-25 16:46:56 +08:00
|
|
|
this.logger.log("error", "General sync error:", e.message);
|
2023-01-13 22:41:29 +08:00
|
|
|
throw e;
|
|
|
|
}
|
2023-01-15 01:51:00 +08:00
|
|
|
this.logger.log("info", "Sync complete, operations performed", operations);
|
2023-01-13 22:41:29 +08:00
|
|
|
|
|
|
|
return operations;
|
|
|
|
}
|
|
|
|
|
2023-01-20 23:08:01 +08:00
|
|
|
async syncFile(
|
|
|
|
name: string,
|
|
|
|
primaryHash: SyncHash | undefined,
|
|
|
|
secondaryHash: SyncHash | undefined,
|
|
|
|
conflictResolver: (
|
|
|
|
name: string,
|
|
|
|
snapshot: Map<string, SyncStatusItem>,
|
|
|
|
primarySpace: SpacePrimitives,
|
|
|
|
secondarySpace: SpacePrimitives,
|
|
|
|
logger: Logger,
|
|
|
|
) => Promise<number>,
|
|
|
|
): Promise<number> {
|
2023-01-25 16:59:15 +08:00
|
|
|
// console.log("Syncing", name, primaryHash, secondaryHash);
|
2023-01-20 23:08:01 +08:00
|
|
|
let operations = 0;
|
|
|
|
|
2023-02-28 18:13:18 +08:00
|
|
|
// Check if not matching one of the excluded prefixes
|
|
|
|
for (const prefix of this.excludePrefixes) {
|
|
|
|
if (name.startsWith(prefix)) {
|
|
|
|
return operations;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-01-20 23:08:01 +08:00
|
|
|
if (
|
2023-01-20 23:51:06 +08:00
|
|
|
primaryHash !== undefined && secondaryHash === undefined &&
|
2023-01-20 23:08:01 +08:00
|
|
|
!this.snapshot.has(name)
|
|
|
|
) {
|
|
|
|
// New file, created on primary, copy from primary to secondary
|
|
|
|
this.logger.log(
|
|
|
|
"info",
|
|
|
|
"New file created on primary, copying to secondary",
|
|
|
|
name,
|
|
|
|
);
|
|
|
|
const { data } = await this.primary.readFile(name, "arraybuffer");
|
|
|
|
const writtenMeta = await this.secondary.writeFile(
|
|
|
|
name,
|
|
|
|
"arraybuffer",
|
|
|
|
data,
|
|
|
|
);
|
|
|
|
this.snapshot.set(name, [
|
|
|
|
primaryHash,
|
|
|
|
writtenMeta.lastModified,
|
|
|
|
]);
|
|
|
|
operations++;
|
|
|
|
} else if (
|
2023-01-20 23:51:06 +08:00
|
|
|
secondaryHash !== undefined && primaryHash === undefined &&
|
2023-01-20 23:08:01 +08:00
|
|
|
!this.snapshot.has(name)
|
|
|
|
) {
|
|
|
|
// New file, created on secondary, copy from secondary to primary
|
|
|
|
this.logger.log(
|
|
|
|
"info",
|
|
|
|
"New file created on secondary, copying from secondary to primary",
|
|
|
|
name,
|
|
|
|
);
|
|
|
|
const { data } = await this.secondary.readFile(name, "arraybuffer");
|
|
|
|
const writtenMeta = await this.primary.writeFile(
|
|
|
|
name,
|
|
|
|
"arraybuffer",
|
|
|
|
data,
|
|
|
|
);
|
|
|
|
this.snapshot.set(name, [
|
|
|
|
writtenMeta.lastModified,
|
|
|
|
secondaryHash,
|
|
|
|
]);
|
|
|
|
operations++;
|
|
|
|
} else if (
|
2023-01-20 23:51:06 +08:00
|
|
|
primaryHash !== undefined && this.snapshot.has(name) &&
|
|
|
|
secondaryHash === undefined
|
2023-01-20 23:08:01 +08:00
|
|
|
) {
|
|
|
|
// File deleted on B
|
|
|
|
this.logger.log(
|
|
|
|
"info",
|
|
|
|
"File deleted on secondary, deleting from primary",
|
|
|
|
name,
|
|
|
|
);
|
|
|
|
await this.primary.deleteFile(name);
|
|
|
|
this.snapshot.delete(name);
|
|
|
|
operations++;
|
|
|
|
} else if (
|
2023-01-20 23:51:06 +08:00
|
|
|
secondaryHash !== undefined && this.snapshot.has(name) &&
|
|
|
|
primaryHash === undefined
|
2023-01-20 23:08:01 +08:00
|
|
|
) {
|
|
|
|
// File deleted on A
|
|
|
|
this.logger.log(
|
|
|
|
"info",
|
|
|
|
"File deleted on primary, deleting from secondary",
|
|
|
|
name,
|
|
|
|
);
|
|
|
|
await this.secondary.deleteFile(name);
|
|
|
|
this.snapshot.delete(name);
|
|
|
|
operations++;
|
|
|
|
} else if (
|
2023-01-20 23:51:06 +08:00
|
|
|
this.snapshot.has(name) && primaryHash === undefined &&
|
|
|
|
secondaryHash === undefined
|
2023-01-20 23:08:01 +08:00
|
|
|
) {
|
|
|
|
// File deleted on both sides, :shrug:
|
|
|
|
this.logger.log(
|
|
|
|
"info",
|
|
|
|
"File deleted on both ends, deleting from status",
|
|
|
|
name,
|
|
|
|
);
|
|
|
|
this.snapshot.delete(name);
|
|
|
|
operations++;
|
|
|
|
} else if (
|
2023-01-20 23:51:06 +08:00
|
|
|
primaryHash !== undefined && secondaryHash !== undefined &&
|
2023-01-20 23:08:01 +08:00
|
|
|
this.snapshot.get(name) &&
|
|
|
|
primaryHash !== this.snapshot.get(name)![0] &&
|
|
|
|
secondaryHash === this.snapshot.get(name)![1]
|
|
|
|
) {
|
|
|
|
// File has changed on primary, but not secondary: copy from primary to secondary
|
|
|
|
this.logger.log(
|
|
|
|
"info",
|
|
|
|
"File changed on primary, copying to secondary",
|
|
|
|
name,
|
|
|
|
);
|
|
|
|
const { data } = await this.primary.readFile(name, "arraybuffer");
|
|
|
|
const writtenMeta = await this.secondary.writeFile(
|
|
|
|
name,
|
|
|
|
"arraybuffer",
|
|
|
|
data,
|
|
|
|
);
|
|
|
|
this.snapshot.set(name, [
|
|
|
|
primaryHash,
|
|
|
|
writtenMeta.lastModified,
|
|
|
|
]);
|
|
|
|
operations++;
|
|
|
|
} else if (
|
2023-01-20 23:51:06 +08:00
|
|
|
primaryHash !== undefined && secondaryHash !== undefined &&
|
2023-01-20 23:08:01 +08:00
|
|
|
this.snapshot.get(name) &&
|
|
|
|
secondaryHash !== this.snapshot.get(name)![1] &&
|
|
|
|
primaryHash === this.snapshot.get(name)![0]
|
|
|
|
) {
|
|
|
|
// File has changed on secondary, but not primary: copy from secondary to primary
|
2023-01-25 16:46:56 +08:00
|
|
|
this.logger.log(
|
|
|
|
"info",
|
|
|
|
"File has changed on secondary, but not primary: copy from secondary to primary",
|
|
|
|
name,
|
|
|
|
);
|
2023-01-20 23:08:01 +08:00
|
|
|
const { data } = await this.secondary.readFile(name, "arraybuffer");
|
|
|
|
const writtenMeta = await this.primary.writeFile(
|
|
|
|
name,
|
|
|
|
"arraybuffer",
|
|
|
|
data,
|
|
|
|
);
|
|
|
|
this.snapshot.set(name, [
|
|
|
|
writtenMeta.lastModified,
|
|
|
|
secondaryHash,
|
|
|
|
]);
|
|
|
|
operations++;
|
|
|
|
} else if (
|
|
|
|
( // File changed on both ends, but we don't have any info in the snapshot (resync scenario?): have to run through conflict handling
|
2023-01-20 23:51:06 +08:00
|
|
|
primaryHash !== undefined && secondaryHash !== undefined &&
|
2023-01-20 23:08:01 +08:00
|
|
|
!this.snapshot.has(name)
|
|
|
|
) ||
|
|
|
|
( // File changed on both ends, CONFLICT!
|
|
|
|
primaryHash && secondaryHash &&
|
|
|
|
this.snapshot.get(name) &&
|
|
|
|
secondaryHash !== this.snapshot.get(name)![1] &&
|
|
|
|
primaryHash !== this.snapshot.get(name)![0]
|
|
|
|
)
|
|
|
|
) {
|
|
|
|
this.logger.log(
|
|
|
|
"info",
|
|
|
|
"File changed on both ends, potential conflict",
|
|
|
|
name,
|
|
|
|
);
|
|
|
|
operations += await conflictResolver(
|
|
|
|
name,
|
|
|
|
this.snapshot,
|
|
|
|
this.primary,
|
|
|
|
this.secondary,
|
|
|
|
this.logger,
|
|
|
|
);
|
|
|
|
} else {
|
|
|
|
// Nothing needs to happen
|
|
|
|
}
|
|
|
|
return operations;
|
|
|
|
}
|
|
|
|
|
2023-01-13 22:41:29 +08:00
|
|
|
// Strategy: Primary wins
|
|
|
|
public static async primaryConflictResolver(
|
|
|
|
name: string,
|
|
|
|
snapshot: Map<string, SyncStatusItem>,
|
|
|
|
primary: SpacePrimitives,
|
|
|
|
secondary: SpacePrimitives,
|
2023-01-15 01:51:00 +08:00
|
|
|
logger: Logger,
|
2023-01-17 01:55:35 +08:00
|
|
|
): Promise<number> {
|
2023-01-15 01:51:00 +08:00
|
|
|
logger.log("info", "Starting conflict resolution for", name);
|
2023-01-13 22:41:29 +08:00
|
|
|
const filePieces = name.split(".");
|
|
|
|
const fileNameBase = filePieces.slice(0, -1).join(".");
|
|
|
|
const fileNameExt = filePieces[filePieces.length - 1];
|
|
|
|
const pageData1 = await primary.readFile(name, "arraybuffer");
|
|
|
|
const pageData2 = await secondary.readFile(name, "arraybuffer");
|
|
|
|
|
2023-01-17 01:55:35 +08:00
|
|
|
if (name.endsWith(".md")) {
|
|
|
|
logger.log("info", "File is markdown, using smart conflict resolution");
|
|
|
|
// Let's use a smartert check for markdown files, ignoring directive bodies
|
|
|
|
const pageText1 = removeDirectiveBody(
|
|
|
|
new TextDecoder().decode(pageData1.data as Uint8Array),
|
|
|
|
);
|
|
|
|
const pageText2 = removeDirectiveBody(
|
|
|
|
new TextDecoder().decode(pageData2.data as Uint8Array),
|
|
|
|
);
|
|
|
|
if (pageText1 === pageText2) {
|
|
|
|
logger.log(
|
|
|
|
"info",
|
|
|
|
"Files are the same (eliminating the directive bodies), no conflict",
|
|
|
|
);
|
2023-01-13 22:41:29 +08:00
|
|
|
snapshot.set(name, [
|
|
|
|
pageData1.meta.lastModified,
|
|
|
|
pageData2.meta.lastModified,
|
|
|
|
]);
|
2023-01-17 01:55:35 +08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
let byteWiseMatch = true;
|
|
|
|
const arrayBuffer1 = new Uint8Array(pageData1.data as ArrayBuffer);
|
|
|
|
const arrayBuffer2 = new Uint8Array(pageData2.data as ArrayBuffer);
|
|
|
|
if (arrayBuffer1.byteLength !== arrayBuffer2.byteLength) {
|
|
|
|
byteWiseMatch = false;
|
|
|
|
}
|
|
|
|
if (byteWiseMatch) {
|
|
|
|
// Byte-wise comparison
|
|
|
|
for (let i = 0; i < arrayBuffer1.byteLength; i++) {
|
|
|
|
if (arrayBuffer1[i] !== arrayBuffer2[i]) {
|
|
|
|
byteWiseMatch = false;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// Byte wise they're still the same, so no confict
|
|
|
|
if (byteWiseMatch) {
|
|
|
|
logger.log("info", "Files are the same, no conflict");
|
|
|
|
snapshot.set(name, [
|
|
|
|
pageData1.meta.lastModified,
|
|
|
|
pageData2.meta.lastModified,
|
|
|
|
]);
|
|
|
|
return 0;
|
|
|
|
}
|
2023-01-13 22:41:29 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
const revisionFileName = filePieces.length === 1
|
|
|
|
? `${name}.conflicted.${pageData2.meta.lastModified}`
|
|
|
|
: `${fileNameBase}.conflicted.${pageData2.meta.lastModified}.${fileNameExt}`;
|
2023-01-15 01:51:00 +08:00
|
|
|
logger.log(
|
|
|
|
"info",
|
2023-01-13 22:41:29 +08:00
|
|
|
"Going to create conflicting copy",
|
|
|
|
revisionFileName,
|
|
|
|
);
|
|
|
|
|
|
|
|
// Copy secondary to conflict copy
|
|
|
|
const localConflictMeta = await primary.writeFile(
|
|
|
|
revisionFileName,
|
|
|
|
"arraybuffer",
|
|
|
|
pageData2.data,
|
|
|
|
);
|
|
|
|
const remoteConflictMeta = await secondary.writeFile(
|
|
|
|
revisionFileName,
|
|
|
|
"arraybuffer",
|
|
|
|
pageData2.data,
|
|
|
|
);
|
|
|
|
|
|
|
|
// Updating snapshot
|
|
|
|
snapshot.set(revisionFileName, [
|
|
|
|
localConflictMeta.lastModified,
|
|
|
|
remoteConflictMeta.lastModified,
|
|
|
|
]);
|
|
|
|
|
|
|
|
// Write replacement on top
|
|
|
|
const writeMeta = await secondary.writeFile(
|
|
|
|
name,
|
|
|
|
"arraybuffer",
|
|
|
|
pageData1.data,
|
|
|
|
true,
|
|
|
|
);
|
|
|
|
|
|
|
|
snapshot.set(name, [pageData1.meta.lastModified, writeMeta.lastModified]);
|
2023-01-17 01:55:35 +08:00
|
|
|
return 1;
|
2023-01-13 22:41:29 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
syncCandidates(files: FileMeta[]): FileMeta[] {
|
2023-01-26 01:29:47 +08:00
|
|
|
return files.filter((f) =>
|
|
|
|
!f.name.startsWith("_plug/") && f.lastModified > 0
|
|
|
|
);
|
2023-01-13 22:41:29 +08:00
|
|
|
}
|
|
|
|
}
|
2023-01-17 01:55:35 +08:00
|
|
|
|
|
|
|
const markdownLanguage = buildMarkdown([]);
|
|
|
|
|
|
|
|
export function removeDirectiveBody(text: string): string {
|
|
|
|
// Parse
|
|
|
|
const tree = parse(markdownLanguage, text);
|
|
|
|
// Remove bodies
|
|
|
|
replaceNodesMatching(tree, (node) => {
|
|
|
|
if (node.type === "DirectiveBody") {
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
});
|
|
|
|
// Turn back into text
|
|
|
|
return renderToText(tree);
|
|
|
|
}
|