-
1
-
2
-
3
-
4
-
5
-
6
-
7
-
8
-
9
-
10
-
11
-
12
-
13
-
14
-
15
-
16
-
17
-
18
-
19
-
20
-
21
-
22
-
23
-
24
-
25
-
26
-
27
-
28
-
29
-
30
-
31
-
32
-
33
-
34
-
35
-
36
-
37
-
38
-
39
-
40
-
41
-
42
-
43
-
44
-
45
-
46
-
47
-
48
-
49
-
50
-
51
-
52
-
53
-
54
-
55
-
56
-
57
-
58
-
59
-
60
-
61
-
62
-
63
-
64
-
65
-
66
-
67
-
68
-
69
-
70
-
71
-
72
-
73
-
74
-
75
-
76
-
77
-
78
-
79
-
80
-
81
-
82
-
83
-
84
-
85
-
86
-
87
-
88
-
89
-
90
-
91
-
92
-
93
-
94
-
95
-
96
-
97
-
98
-
99
-
100
-
101
-
102
-
103
-
104
-
105
-
106
-
107
-
108
-
109
-
110
-
111
-
112
-
113
-
114
-
115
-
116
-
117
-
118
-
119
-
120
-
121
-
122
-
123
-
124
-
125
-
126
-
127
-
128
-
129
-
130
-
131
-
132
-
133
-
134
-
135
-
136
-
137
-
138
-
139
-
140
-
141
-
142
-
143
-
144
-
145
-
146
-
147
-
148
-
149
-
150
-
151
-
152
-
153
-
154
-
155
-
156
-
157
-
158
-
159
-
160
-
161
-
162
-
163
-
164
-
165
-
166
-
167
-
168
-
169
-
170
-
171
-
172
-
173
-
174
-
175
-
176
-
177
-
178
-
179
-
180
-
181
-
182
-
183
-
184
-
185
-
186
-
187
-
188
-
189
-
190
-
191
-
192
-
193
-
194
-
195
-
196
-
197
-
198
-
199
-
200
-
201
-
202
-
203
-
204
-
205
-
206
-
207
-
208
-
209
-
210
-
211
-
212
-
213
-
214
-
215
-
216
-
217
-
218
-
219
-
220
-
221
-
222
-
223
-
224
-
225
-
226
-
227
-
228
-
229
-
230
-
231
-
232
-
233
-
234
-
235
-
236
-
237
-
238
-
239
-
240
-
241
-
242
-
243
-
244
-
245
-
246
-
247
-
248
-
249
-
250
-
251
-
252
-
253
-
254
-
255
-
256
-
257
-
258
-
259
-
260
-
261
-
262
-
263
-
264
-
265
-
266
-
267
-
268
-
269
-
270
-
271
-
272
-
273
-
274
-
275
-
276
-
277
-
278
-
279
-
280
-
281
-
282
-
283
-
284
-
285
-
286
-
287
-
288
-
289
-
290
-
291
-
292
-
293
-
294
-
295
-
296
-
297
-
298
-
299
-
300
-
301
-
302
-
303
-
304
-
305
-
306
-
307
-
308
-
309
-
310
-
311
-
312
-
313
-
314
-
315
-
316
-
317
-
318
-
319
-
320
-
321
-
322
-
323
-
324
-
325
-
326
-
327
-
328
-
329
-
330
-
331
-
332
-
333
-
334
-
335
-
336
-
337
-
338
-
339
-
340
-
341
-
342
-
343
-
344
-
345
-
346
-
347
-
348
-
349
-
350
-
351
-
352
-
353
-
354
-
355
-
356
-
357
-
358
-
359
-
360
-
361
-
362
-
363
-
364
-
365
-
366
-
367
-
368
-
369
-
370
-
371
-
372
-
373
-
374
-
375
-
376
-
377
-
378
-
379
-
380
-
381
-
382
-
383
-
384
-
385
-
386
-
387
-
388
-
389
-
390
-
391
-
392
-
393
-
394
-
395
-
396
-
397
-
398
-
399
-
400
-
401
-
402
-
403
-
404
-
405
-
406
-
407
-
408
-
409
-
410
-
411
-
412
-
413
-
414
-
415
-
416
-
417
-
418
-
419
-
420
-
421
-
422
-
423
-
424
-
425
-
426
-
427
-
428
-
429
-
430
-
431
-
432
-
433
-
434
-
435
-
436
-
437
-
438
-
439
-
440
-
441
-
442
-
443
-
444
-
445
-
446
-
447
-
448
-
449
-
450
-
451
-
452
-
453
-
454
-
455
-
456
-
457
-
458
-
459
-
460
-
461
-
462
-
463
-
464
-
465
-
466
-
467
-
468
-
469
-
470
-
471
-
472
-
473
-
474
-
475
-
476
-
477
-
478
-
479
-
480
-
481
-
482
-
483
-
484
-
485
-
486
-
487
-
488
-
489
-
490
-
491
-
492
-
493
-
494
-
495
-
496
-
497
-
498
-
499
-
500
-
501
-
502
-
503
-
504
-
505
-
506
-
507
-
508
-
509
-
510
-
511
-
512
-
513
-
514
-
515
-
516
-
517
-
518
-
519
-
520
-
521
-
522
-
523
-
524
-
525
-
526
-
527
-
528
-
529
-
530
-
531
-
532
-
533
-
534
-
535
-
536
-
537
-
538
-
539
-
540
-
541
-
542
-
543
-
544
-
545
-
546
-
547
-
548
-
549
-
550
-
551
-
552
-
553
-
554
-
555
-
556
-
557
-
558
// SPDX-FileCopyrightText: 2024 Shota FUJI <pockawoooh@gmail.com>
//
// SPDX-License-Identifier: Apache-2.0
import { extname } from "../deps/deno.land/std/path/mod.ts";
import type { BuildParameters, TreeBuilder } from "./interface.ts";
import type {
AssetToken,
DirectoryReader,
Document,
DocumentDirectory,
DocumentMetadata,
DocumentToken,
DocumentTree,
FileReader,
RootDirectoryReader,
} from "../types.ts";
// Separator used when joining path segments into a single string, both for
// the keys of the lookup maps built in this module and for paths shown in
// error messages.
const INTERNAL_PATH_SEPARATOR = "/";
/**
 * Result of a single tree build strategy call: either a request to leave the
 * node out of the tree (`skip: true`), or the metadata to carry forward for
 * that node.
 */
export type TreeBuildStrategyFunctionReturns = {
skip: true;
} | {
skip?: false;
metadata: DocumentMetadata;
};
/**
 * Callback run by `DefaultTreeBuilder` on each file or directory it visits.
 * It receives the node together with the metadata accumulated so far and
 * answers with either a skip request or the (possibly modified) metadata.
 * The answer may be returned directly or wrapped in a Promise.
 */
export interface TreeBuildStrategy {
(
fileOrDirectory: FileReader | DirectoryReader,
metadata: DocumentMetadata,
):
| TreeBuildStrategyFunctionReturns
| Promise<TreeBuildStrategyFunctionReturns>;
}
/**
 * Builds a strategy that keeps a file only when its name ends with one of
 * the given extensions. Directories always pass through untouched.
 *
 * @param exts - Accepted file extensions, each including the leading dot.
 * @returns A strategy that skips files whose name matches none of `exts`.
 */
export function fileExtensions(exts: readonly string[]): TreeBuildStrategy {
  return (node, metadata) => {
    // Non-file nodes are never filtered by extension.
    const accepted = node.type !== "file" ||
      exts.some((ext) => node.name.endsWith(ext));
    return accepted ? { metadata } : { skip: true };
  };
}
/**
 * Builds a strategy that drops every node the predicate selects.
 *
 * @param f - Predicate called with each file or directory. Returning `true`
 *   excludes that node from the document tree; otherwise the metadata is
 *   passed through unchanged.
 */
export function ignore(
  f: (fileOrDirectory: FileReader | DirectoryReader) => boolean,
): TreeBuildStrategy {
  return (node, metadata) => (f(node) ? { skip: true } : { metadata });
}
/**
 * Builds a strategy that leaves out every file and directory whose name
 * begins with a dot.
 */
export function ignoreDotfiles(): TreeBuildStrategy {
  const isDotfile = (entry: FileReader | DirectoryReader): boolean =>
    entry.name.startsWith(".");
  return ignore(isDotfile);
}
/**
 * Builds a strategy that recognises directories named after a language.
 *
 * When a directory's name is a key of `langs`, its metadata receives the
 * mapped value as `title` and the directory name as `language`. Files,
 * unknown directory names and entries mapped to an empty title are passed
 * through unchanged.
 *
 * @param langs - Directory name (used as the language) to display title.
 * @param topLevelOnly - When `true`, only nodes whose parent is the root
 *   directory are considered. Defaults to `false`.
 */
export function langDir(
  langs: Record<string, string>,
  topLevelOnly: boolean = false,
): TreeBuildStrategy {
  const titles = new Map(Object.entries(langs));
  return (node, metadata) => {
    const outOfScope = topLevelOnly && node.parent.type !== "root";
    if (outOfScope || node.type !== "directory") {
      return { metadata };
    }
    const title = titles.get(node.name);
    return title
      ? { metadata: { ...metadata, title, language: node.name } }
      : { metadata };
  };
}
/**
 * Builds a strategy that strips the file extension from a file's metadata.
 * Both `title` and `name` are set to the file name without its extension,
 * e.g. "Bar.md" becomes `{ title: "Bar", name: "Bar" }`. Directories are
 * passed through unchanged.
 */
export function removeExtFromMetadata(): TreeBuildStrategy {
  return (node, metadata) => {
    if (node.type === "file") {
      const extension = extname(node.name);
      // A name without an extension is used as-is.
      const withoutExt = extension.length > 0
        ? node.name.slice(0, node.name.length - extension.length)
        : node.name;
      return { metadata: { ...metadata, title: withoutExt, name: withoutExt } };
    }
    return { metadata };
  };
}
/**
 * Mark file at specific path to be the default document.
 *
 * The file's path must equal `path` segment by segment. A file whose path is
 * merely a prefix of `path` (or longer than it) is not marked.
 *
 * @param path - Relative path from the root directory (FileSystem Reader).
 * @returns A strategy that sets `isDefaultDocument: true` on the metadata of
 *   the matching file and passes every other node through unchanged.
 */
export function defaultDocumentAt(path: readonly string[]): TreeBuildStrategy {
  return (node, metadata) => {
    if (node.type !== "file") {
      return { metadata };
    }
    // `every` alone only checks as many segments as `node.path` has, so a
    // shorter path would match as a prefix. Compare the lengths first.
    const isTarget = node.path.length === path.length &&
      node.path.every((segment, i) => segment === path[i]);
    if (!isTarget) {
      return { metadata };
    }
    return {
      metadata: {
        ...metadata,
        isDefaultDocument: true,
      },
    };
  };
}
/**
 * Type guard for asset tokens: strings that start with "mxa_".
 */
function isAssetToken(token: unknown): token is AssetToken {
  if (typeof token !== "string") {
    return false;
  }
  return token.startsWith("mxa_");
}
/**
 * Type guard for document tokens: strings that start with "mxt_".
 */
function isDocumentToken(token: unknown): token is DocumentToken {
  if (typeof token !== "string") {
    return false;
  }
  return token.startsWith("mxt_");
}
/**
 * Resolves a link path against the path of the file that contains the link.
 *
 * A path whose first segment is the empty string is treated as absolute: the
 * remaining segments are returned as-is. Otherwise resolution starts from the
 * directory of `base` (that is, `base` without its last segment); "." segments
 * are ignored and ".." segments drop the last segment collected so far.
 *
 * @param path - Segments of the link to resolve.
 * @param base - Segments of the path of the file the link appears in.
 * @returns The resolved path segments, relative to the root directory.
 */
function resolveFsrPath(
  path: readonly string[],
  base: readonly string[],
): readonly string[] {
  const [head, ...rest] = path;
  if (head === "") {
    // Absolute path
    return rest;
  }
  const resolved: string[] = base.slice(0, -1);
  for (const fragment of path) {
    if (fragment === ".") {
      continue;
    }
    if (fragment === "..") {
      // Popping an already empty list is a no-op, so ".." cannot climb above the root.
      resolved.pop();
      continue;
    }
    resolved.push(fragment);
  }
  return resolved;
}
/**
 * Completes a reference whose last segment carries no file extension.
 *
 * The path is returned unchanged when it is empty or when its last segment
 * contains a ".". Otherwise the directory holding the last segment is read
 * and the path of the single file whose name, minus its final extension,
 * equals that segment is returned.
 *
 * @param root - Vault root directory.
 * @param path - Resolved path.
 * @returns `path` itself when no lookup is needed, otherwise a Promise of the
 *   matching file's path. The Promise rejects with an `Error` when no file or
 *   more than one file matches.
 */
function resolveExtensionLessPath(
  root: RootDirectoryReader,
  path: readonly string[],
): readonly string[] | Promise<readonly string[]> {
  const filename = path[path.length - 1];
  if (!filename || filename.includes(".")) {
    return path;
  }
  const parentSegments = path.slice(0, -1);

  const findClosestFile = async (
    dir: DirectoryReader | RootDirectoryReader,
  ): Promise<readonly string[]> => {
    const candidates = (await dir.read()).filter((entry) => {
      if (entry.type !== "file") {
        return false;
      }
      // The stem is everything before the last dot. A name without a dot has
      // an empty stem, which can never equal the (non-empty) requested name.
      const lastDot = entry.name.lastIndexOf(".");
      return lastDot !== -1 && entry.name.slice(0, lastDot) === filename;
    });

    if (candidates.length === 1) {
      return candidates[0].path;
    }
    if (candidates.length > 1) {
      // TODO: Custom error class
      throw new Error(
        "DefaultTreeBuilder: cannot resolve extension-less reference, " +
          "there is several files with same stem but different extensions: " +
          `requested = ${path.join(INTERNAL_PATH_SEPARATOR)}, ` +
          `found = [${candidates.map((entry) => entry.name).join(", ")}].`,
      );
    }
    const dirPath = parentSegments.length > 0
      ? parentSegments.join(INTERNAL_PATH_SEPARATOR)
      : "Root directory ";
    throw new Error(
      "DefaultTreeBuilder: cannot resolve extension-less reference, " +
        `${dirPath} does not contain any files whose stem is "${filename}".`,
    );
  };

  const dir = parentSegments.length > 0
    ? root.openDirectory(parentSegments)
    : root;
  // `openDirectory` may answer with a Promise; chain on it in that case.
  return dir instanceof Promise ? dir.then(findClosestFile) : findClosestFile(dir);
}
/**
 * State threaded through the recursive build of a document tree.
 */
interface InternalBuildParameters {
// Parser used to turn each file into document content.
contentParser: BuildParameters["contentParser"];
// Root directory, used to resolve and open files referenced by links.
root: RootDirectoryReader;
// Document-tree path of the parent node; treated as empty when omitted.
parentPath?: readonly string[];
// Asset token -> file it was issued for.
assetTokensToFiles: Map<AssetToken, FileReader>;
// Document token -> resolved target path, joined with the internal path separator.
documentTokenToPaths: Map<DocumentToken, string>;
// File path (joined with the internal path separator) -> document built from that file.
pathToDocuments: Map<string, Document>;
}
/**
 * Options accepted by the `DefaultTreeBuilder` constructor.
 */
export interface DefaultTreeBuilderConfig {
/**
* Default language tag (BCP 47).
* It is reported as `defaultLanguage` on the built tree and used as the
* locale of the default sorter.
*/
defaultLanguage: string;
/**
* A list of callback functions that control whether a file or a directory should be
* included in the document tree and override document metadata.
* Strategies run in order for each node: each one receives the metadata returned
* by the previous one, and the first `skip` result excludes the node.
* @default An empty list.
*/
strategies?: readonly TreeBuildStrategy[];
/**
* Sort function for document and document directory.
* This function is directly passed to `Array.prototype.toSorted`.
* @default A function that compares `metadata.title` using `String.prototype.localeCompare` with the default language as the locale.
*/
sorter?(
a: Document | DocumentDirectory,
b: Document | DocumentDirectory,
): number;
}
/**
 * Tree builder that walks the file system from the root directory, runs the
 * configured strategies on every file and directory it visits, and parses the
 * surviving files into documents.
 */
export class DefaultTreeBuilder implements TreeBuilder {
  /** Language tag reported on the tree and used as the locale of the default sorter. */
  #defaultLanguage: string;
  /** Strategies applied, in order, to every visited file and directory. */
  #strategies: readonly TreeBuildStrategy[];
  /** Comparator handed to `toSorted` for every list of sibling nodes. */
  #sorter: (
    a: Document | DocumentDirectory,
    b: Document | DocumentDirectory,
  ) => number;

  /**
   * @param config - Default language, optional strategies (none when
   *   omitted) and optional sorter (compares titles when omitted).
   */
  constructor(config: DefaultTreeBuilderConfig) {
    this.#defaultLanguage = config.defaultLanguage;
    this.#strategies = config.strategies || [];
    const compareByTitle = (
      a: Document | DocumentDirectory,
      b: Document | DocumentDirectory,
    ): number =>
      a.metadata.title.localeCompare(b.metadata.title, this.#defaultLanguage);
    this.#sorter = config.sorter || compareByTitle;
  }

  /**
   * Builds the document tree for everything below the root directory.
   *
   * @returns The sorted top-level nodes, the default document, the default
   *   language and an `exchangeToken` function that maps tokens issued during
   *   parsing back to the asset file or document they stand for.
   * @throws Error when the resulting tree contains no document at all.
   */
  async build(
    { fileSystemReader, contentParser }: BuildParameters,
  ): Promise<DocumentTree> {
    const root = await fileSystemReader.getRootDirectory();
    const assetTokensToFiles = new Map<AssetToken, FileReader>();
    const documentTokenToPaths = new Map<DocumentToken, string>();
    const pathToDocuments = new Map<string, Document>();
    const context: InternalBuildParameters = {
      contentParser,
      root,
      assetTokensToFiles,
      documentTokenToPaths,
      pathToDocuments,
    };

    const topLevel = await root.read();
    const built = await Promise.all(
      topLevel.map((child) => this.#build(child, context)),
    );
    const nodes = built
      .filter((node): node is Document | DocumentDirectory => node !== null)
      .toSorted(this.#sorter);

    const defaultDocument = this.#findDefaultDocument(nodes);
    if (!defaultDocument) {
      throw new Error(
        "No document found. Document tree must have at least one document.",
      );
    }

    // Maps a token handed out during parsing back to its asset file or document.
    const exchangeToken = ((token) => {
      if (isAssetToken(token)) {
        const file = assetTokensToFiles.get(token);
        if (file) {
          return file;
        }
        throw new Error(
          `DefaultTreeBuilder: No asset file correspond to Asset Token ${token}`,
        );
      }
      if (!isDocumentToken(token)) {
        throw new Error(`DefaultTreeBuilder: Invalid token type: ${token}`);
      }
      const path = documentTokenToPaths.get(token);
      if (!path) {
        throw new Error(
          `DefaultTreeBuilder: No document path registered for the Document Token ${token}`,
        );
      }
      const doc = pathToDocuments.get(path);
      if (!doc) {
        throw new Error(
          `DefaultTreeBuilder: No document at the path ${path}, referenced by token ${token}`,
        );
      }
      return doc;
    }) as DocumentTree["exchangeToken"];

    return {
      type: "tree",
      nodes,
      defaultDocument,
      defaultLanguage: this.#defaultLanguage,
      exchangeToken,
    };
  }

  /**
   * Builds the tree node for one file or directory.
   *
   * @returns The document or directory node, or `null` when a strategy asked
   *   to skip the node or when a directory ends up without any entry.
   */
  async #build(
    node: FileReader | DirectoryReader,
    context: InternalBuildParameters,
  ): Promise<DocumentDirectory | Document | null> {
    const {
      contentParser,
      root,
      assetTokensToFiles,
      documentTokenToPaths,
      pathToDocuments,
      parentPath = [],
    } = context;

    // Strategies run one after another; each sees the previous one's metadata.
    let metadata: DocumentMetadata = { name: node.name, title: node.name };
    for (const applyStrategy of this.#strategies) {
      const outcome = await applyStrategy(node, metadata);
      if (outcome.skip) {
        // TODO: Debug log (or this should be in the each strategies?)
        return null;
      }
      metadata = outcome.metadata;
    }

    if (node.type !== "file") {
      const ownPath = [...parentPath, metadata.name];
      const children = await node.read();
      const builtChildren = await Promise.all(
        children.map((child) =>
          this.#build(child, { ...context, parentPath: ownPath })
        ),
      );
      const entries = builtChildren
        .filter((child): child is Document | DocumentDirectory =>
          child !== null
        )
        .toSorted(this.#sorter);
      // A directory without any surviving entry is left out of the tree.
      if (entries.length === 0) {
        return null;
      }
      return {
        type: "directory",
        metadata,
        directory: node,
        entries,
        path: ownPath,
      };
    }

    const parsed = await contentParser.parse({
      fileReader: node,
      documentMetadata: metadata,
      getAssetToken: async (path) => {
        if (path.length === 0) {
          throw new Error(
            `Asset link cannot be empty (processing ${
              node.path.join(INTERNAL_PATH_SEPARATOR)
            })`,
          );
        }
        const token: AssetToken = `mxa_${crypto.randomUUID()}`;
        const target = await resolveExtensionLessPath(
          root,
          resolveFsrPath(path, node.path),
        );
        const file = await root.openFile(target);
        assetTokensToFiles.set(token, file);
        return token;
      },
      getDocumentToken: async (path) => {
        if (path.length === 0) {
          throw new Error(
            `Document link cannot be empty (processing ${
              node.path.join(INTERNAL_PATH_SEPARATOR)
            })`,
          );
        }
        const token: DocumentToken = `mxt_${crypto.randomUUID()}`;
        const target = await resolveExtensionLessPath(
          root,
          resolveFsrPath(path, node.path),
        );
        // Only the path is stored; the document is looked up when the token is exchanged.
        documentTokenToPaths.set(token, target.join(INTERNAL_PATH_SEPARATOR));
        return token;
      },
    });

    // The parser may return bare content, or content together with replacement metadata.
    const finalMetadata: DocumentMetadata = "documentMetadata" in parsed
      ? parsed.documentMetadata
      : metadata;
    const document: Document = {
      type: "document",
      metadata: finalMetadata,
      file: node,
      content: "documentContent" in parsed ? parsed.documentContent : parsed,
      path: [...parentPath, finalMetadata.name],
    };
    pathToDocuments.set(node.path.join(INTERNAL_PATH_SEPARATOR), document);
    return document;
  }

  /**
   * Picks the default document of a tree.
   *
   * The first document (in depth-first order) flagged with
   * `isDefaultDocument` wins. Without such a flag, the first document seen at
   * the shallowest depth that has any document is used.
   *
   * @param tree - Sibling nodes to search.
   * @param depth - Depth of `tree`; `0` for the top level.
   * @param registry - First document seen per depth, shared across the recursion.
   * @returns The default document, or `null` when none is found. Nested
   *   calls only ever return a flagged document.
   */
  #findDefaultDocument(
    tree: ReadonlyArray<Document | DocumentDirectory>,
    depth: number = 0,
    registry: Map<number, Document> | null = null,
  ): Document | null {
    const firstByDepth = registry || new Map<number, Document>();

    for (const item of tree) {
      if (item.type !== "document") {
        const flagged = this.#findDefaultDocument(
          item.entries,
          depth + 1,
          firstByDepth,
        );
        if (flagged) {
          return flagged;
        }
        continue;
      }
      if (item.metadata.isDefaultDocument) {
        return item;
      }
      if (!firstByDepth.has(depth)) {
        firstByDepth.set(depth, item);
      }
    }

    // Only the outermost call falls back to the shallowest document.
    if (depth !== 0 || firstByDepth.size === 0) {
      return null;
    }
    const shallowest = Math.min(...firstByDepth.keys());
    return firstByDepth.get(shallowest) ?? null;
  }
}