-
1
-
2
-
3
-
4
-
5
-
6
-
7
-
8
-
9
-
10
-
11
-
12
-
13
-
14
-
15
-
16
-
17
-
18
-
19
-
20
-
21
-
22
-
23
-
24
-
25
-
26
-
27
-
28
-
29
-
30
-
31
-
32
-
33
-
34
-
35
-
36
-
37
-
38
-
39
-
40
-
41
-
42
-
43
-
44
-
45
-
46
-
47
-
48
-
49
-
50
-
51
-
52
-
53
-
54
-
55
-
56
-
57
-
58
-
59
-
60
-
61
-
62
-
63
-
64
-
65
-
66
-
67
-
68
-
69
-
70
-
71
-
72
-
73
-
74
-
75
-
76
-
77
-
78
-
79
-
80
-
81
-
82
-
83
-
84
-
85
-
86
-
87
-
88
-
89
-
90
-
91
-
92
-
93
-
94
-
95
-
96
-
97
-
98
-
99
-
100
-
101
-
102
-
103
-
104
-
105
-
106
-
107
-
108
-
109
-
110
-
111
-
112
-
113
-
114
-
115
-
116
-
117
-
118
-
119
-
120
-
121
-
122
-
123
-
124
-
125
-
126
-
127
-
128
-
129
-
130
-
131
-
132
-
133
-
134
-
135
-
136
-
137
-
138
-
139
-
140
-
141
-
142
-
143
-
144
-
145
-
146
-
147
-
148
-
149
-
150
-
151
-
152
-
153
-
154
-
155
-
156
-
157
-
158
-
159
-
160
-
161
-
162
-
163
-
164
-
165
-
166
-
167
-
168
-
169
-
170
-
171
-
172
-
173
-
174
-
175
-
176
-
177
-
178
-
179
-
180
-
181
-
182
-
183
-
184
-
185
-
186
-
187
-
188
-
189
-
190
-
191
-
192
-
193
-
194
-
195
-
196
-
197
-
198
-
199
-
200
-
201
-
202
-
203
-
204
-
205
-
206
-
207
-
208
-
209
-
210
-
211
-
212
-
213
-
214
-
215
-
216
-
217
-
218
-
219
-
220
-
221
-
222
-
223
-
224
-
225
-
226
-
227
-
228
-
229
-
230
-
231
-
232
-
233
-
234
-
235
-
236
-
237
-
238
-
239
-
240
-
241
-
242
-
243
-
244
-
245
-
246
-
247
-
248
-
249
-
250
-
251
-
252
-
253
-
254
-
255
-
256
-
257
-
258
-
259
-
260
-
261
-
262
-
263
-
264
-
265
-
266
-
267
-
268
-
269
-
270
-
271
-
272
-
273
-
274
-
275
-
276
-
277
-
278
-
279
-
280
-
281
-
282
-
283
-
284
-
285
-
286
-
287
-
288
-
289
-
290
-
291
-
292
-
293
-
294
-
295
-
296
-
297
// SPDX-FileCopyrightText: 2024 Shota FUJI <pockawoooh@gmail.com>
//
// SPDX-License-Identifier: Apache-2.0
import { test as testFrontmatter } from "../../deps/deno.land/std/front_matter/test.ts";
import * as yamlFrontmatter from "../../deps/deno.land/std/front_matter/yaml.ts";
import type * as Mdast from "../../deps/esm.sh/mdast/types.ts";
import { fromMarkdown } from "../../deps/esm.sh/mdast-util-from-markdown/mod.ts";
import { toString } from "../../deps/esm.sh/mdast-util-to-string/mod.ts";
import { headingRange } from "../../deps/esm.sh/mdast-util-heading-range/mod.ts";
import { find as findNode } from "../../deps/esm.sh/unist-util-find/mod.ts";
import { ofm } from "../../lib/micromark_extension_ofm/mod.ts";
import {
type OfmBlockIdentifier,
ofmFromMarkdown,
} from "../../lib/mdast_util_ofm/mod.ts";
import { macanaMarkAssets } from "./obsidian_markdown/mdast_util_macana_mark_assets.ts";
import { macanaMarkDocumentToken } from "./obsidian_markdown/mdast_util_macana_mark_document_token.ts";
import { autoHeadingIdFromMarkdown } from "../../lib/mdast_util_auto_heading_id/mod.ts";
import { logger } from "../logger.ts";
import type {
ContentParser,
ContentParseResult,
ParseParameters,
} from "./interface.ts";
import type { DocumentContent } from "../types.ts";
function getFrontMatterBooleanValue(
frontmatter: Record<string, unknown>,
key: string,
): boolean | undefined {
if (!(key in frontmatter)) {
return undefined;
}
const value = frontmatter[key];
if (typeof value !== "boolean") {
return undefined;
}
return value;
}
function getFrontMatterValue(
frontmatter: Record<string, unknown>,
key: string,
): string | undefined {
if (!(key in frontmatter)) {
return undefined;
}
const value = frontmatter[key];
if (typeof value !== "string") {
return undefined;
}
return value;
}
function getFrontMatterDate(
frontmatter: Record<string, unknown>,
key: string,
): Date | undefined {
if (!(key in frontmatter)) {
return undefined;
}
const value = frontmatter[key];
if (!(value instanceof Date) || isNaN(+value)) {
return undefined;
}
return value;
}
export type ObsidianMarkdownDocument = DocumentContent<
"obsidian_markdown",
Mdast.Nodes
>;
export interface ObsidianMarkdownParserOptions {
/**
* Whether to enable reading of YAML frontmatter.
* @default false
*/
frontmatter?: boolean;
}
/**
* @internal
*/
export async function parseMarkdown(
markdown: string | Uint8Array,
{ getAssetToken, getDocumentToken }: Pick<
ParseParameters,
"getAssetToken" | "getDocumentToken"
>,
): Promise<Mdast.Root> {
const mdast = fromMarkdown(markdown, {
extensions: [ofm()],
mdastExtensions: [
ofmFromMarkdown({ blockIdentifier: { hoist: true } }),
autoHeadingIdFromMarkdown(),
],
});
await macanaMarkDocumentToken(mdast, getDocumentToken);
await macanaMarkAssets(mdast, getAssetToken);
return mdast;
}
function haveId<Node extends Mdast.Node>(
node: Node,
): node is Node & { data: { hProperties: { id: string } } } {
if (
!node.data || !("hProperties" in node.data) ||
typeof node.data.hProperties !== "object" || !node.data.hProperties
) {
return false;
}
if (
!("id" in node.data.hProperties) ||
typeof node.data.hProperties.id !== "string"
) {
return false;
}
return true;
}
function findNodeId(
root: Mdast.Root,
selectors: readonly string[],
): string | null {
if (!selectors.length) {
return null;
}
const [selector, ...rest] = selectors;
if (selector.startsWith("^")) {
const ident = selector.slice(1);
const found = findNode(root, (node) => {
// Non-hoisted block identifier
if (
node.type === "ofmBlockIdentifier" &&
(node as OfmBlockIdentifier).value === ident
) {
return true;
}
// Hoisted parent block
if (!haveId(node)) {
return false;
}
return node.data.hProperties.id === ident;
});
if (!found) {
logger().error(
`Macana couldn't find a block having a block ID "${selector}".` +
` You have to manually define the block identifier at the target location.`,
{ selector },
);
return null;
}
return ident;
}
const text = toString(fromMarkdown(selector, {
extensions: [ofm()],
mdastExtensions: [ofmFromMarkdown()],
}));
let found: string | null = null;
headingRange(
root,
(textContent) => textContent === text,
(start, nodes) => {
if (rest.length) {
found = findNodeId({ type: "root", children: nodes }, rest);
return;
}
if (!haveId(start)) {
return;
}
found = start.data.hProperties.id;
return;
},
);
return found;
}
async function ok(
markdown: string | Uint8Array,
{ fileReader, getDocumentToken, getAssetToken }: Pick<
ParseParameters,
"getAssetToken" | "getDocumentToken" | "fileReader"
>,
): Promise<ObsidianMarkdownDocument> {
const mdast = await parseMarkdown(markdown, {
getDocumentToken,
getAssetToken,
});
return {
kind: "obsidian_markdown",
content: mdast,
getHash(selectors) {
const id = findNodeId(mdast, selectors);
if (!id) {
const filepath = fileReader.path.join("/");
throw new Error(
`${filepath} does not contain heading or custom block matching "${
selectors.join(" > ")
}".`,
);
}
return id;
},
};
}
/**
* Content parser for Obsidian Flavored Markdown documents.
*/
export class ObsidianMarkdownParser
implements ContentParser<ObsidianMarkdownDocument> {
#frontmatter: boolean;
constructor({ frontmatter = false }: ObsidianMarkdownParserOptions = {}) {
this.#frontmatter = frontmatter;
}
async parse(
{ fileReader, documentMetadata, getDocumentToken, getAssetToken }:
ParseParameters,
): Promise<ContentParseResult<ObsidianMarkdownDocument>> {
const bytes = await fileReader.read();
if (!this.#frontmatter) {
return ok(bytes, { getDocumentToken, getAssetToken, fileReader });
}
const decoded = new TextDecoder().decode(bytes);
if (!testFrontmatter(decoded)) {
return ok(bytes, { getDocumentToken, getAssetToken, fileReader });
}
const frontmatter = yamlFrontmatter.extract(decoded);
const name = getFrontMatterValue(frontmatter.attrs, "name");
const title = getFrontMatterValue(frontmatter.attrs, "title");
const description = getFrontMatterValue(frontmatter.attrs, "description");
const lang = getFrontMatterValue(frontmatter.attrs, "lang") ||
getFrontMatterValue(frontmatter.attrs, "language");
const createdAt = getFrontMatterDate(frontmatter.attrs, "createdAt");
const updatedAt = getFrontMatterDate(frontmatter.attrs, "updatedAt");
const isDefaultDocument = getFrontMatterBooleanValue(
frontmatter.attrs,
"defaultDocument",
);
return {
documentMetadata: {
...documentMetadata,
name: name || documentMetadata.name,
title: title || documentMetadata.title,
description: description || documentMetadata.description,
language: lang || documentMetadata.language,
createdAt: createdAt || documentMetadata.createdAt,
updatedAt: updatedAt || documentMetadata.updatedAt,
isDefaultDocument: isDefaultDocument ||
documentMetadata.isDefaultDocument,
},
documentContent: await ok(frontmatter.body, {
getDocumentToken,
getAssetToken,
fileReader,
}),
};
}
}