diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index 1d9ca3ad..7ea47b94 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -72,6 +72,14 @@ jobs:
       - name: Build editor-ext
         run: pnpm --filter @docmost/editor-ext build
 
+      # @docmost/prosemirror-markdown is the shared converter (#293/#326). Its
+      # build/ output is gitignored and plain `pnpm -r test` does NOT honour nx
+      # `dependsOn: ^build`, so build it before the recursive test run; otherwise
+      # its consumers (mcp `pretest: tsc`, git-sync vitest typecheck) fail with
+      # "TS2307: Cannot find module '@docmost/prosemirror-markdown'".
+      - name: Build prosemirror-markdown
+        run: pnpm --filter @docmost/prosemirror-markdown build
+
       - name: Run unit tests
         run: pnpm -r test
 
diff --git a/.gitignore b/.gitignore
index bbc6abc1..0f97bb35 100644
--- a/.gitignore
+++ b/.gitignore
@@ -4,12 +4,21 @@
 data
 # compiled output
 /dist
-node_modules/
+node_modules
 
 # git-sync compiled output (built in CI/Docker via `pnpm build`, never committed,
 # so src/ and prod can never silently diverge).
 packages/git-sync/build/
 
+# prosemirror-markdown compiled output (built in CI/Docker via `pnpm build`,
+# never committed, so src/ and prod can never silently diverge).
+packages/prosemirror-markdown/build/
+
+# mcp compiled output (built in CI/Docker via `pnpm build`, never committed, so
+# src/ and prod can never silently diverge). Matches the git-sync and
+# prosemirror-markdown convention; the package is private and rebuilt at deploy.
+packages/mcp/build/
+
 # Logs
 logs
 *.log
diff --git a/AGENTS.md b/AGENTS.md
index 1a13dea6..9bedbc39 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -200,7 +200,8 @@ pnpm workspace (`pnpm@10.4.0`) orchestrated by **Nx**. Four workspace packages:
 | `apps/server` | `server` | NestJS 11 + Fastify, Kysely (Postgres), Redis | Backend API, collaboration, AI |
 | `apps/client` | `client` | React 18 + Vite + Mantine 8 + TanStack Query + Jotai | SPA frontend |
 | `packages/editor-ext` | `@docmost/editor-ext` | Tiptap/ProseMirror | Shared Tiptap node/mark extensions, imported by both the client and the server |
-| `packages/mcp` | `@docmost/mcp` | MCP SDK, Tiptap, Yjs | Standalone MCP server, also bundled into the server at `/mcp`. Does **not** import `editor-ext` — it keeps its own vendored mirror of the schema in `packages/mcp/src/lib/` |
+| `packages/mcp` | `@docmost/mcp` | MCP SDK, Tiptap, Yjs | Standalone MCP server, also bundled into the server at `/mcp`. Consumes the shared converter/schema from `@docmost/prosemirror-markdown` (#293) — it no longer carries its own vendored converter/schema copy |
+| `packages/prosemirror-markdown` | `@docmost/prosemirror-markdown` | Tiptap, marked, jsdom | The single, canonical ProseMirror↔Markdown converter + Docmost schema mirror (#293). Consumed by `mcp` and `git-sync`; there is exactly ONE copy of the converter now |
 
 `build` targets are Nx-cached and dependency-ordered (`dependsOn: ["^build"]`), so `editor-ext` builds before the apps. `nx.json` sets `affected.defaultBase: main`.
 
@@ -282,7 +283,7 @@ The API server is a Fastify app with a global `/api` prefix (`main.ts` excludes
 ### Client structure
 Vite SPA. Code is organized by feature under `apps/client/src/features/*` (mirrors the server domains: `page`, `space`, `comment`, `ai-chat`, `editor`, …). Conventions:
 - **TanStack Query** for server state (one `queries/` file per feature), **Jotai** atoms for local/shared UI state, **Mantine 8** + CSS modules (`*.module.css`) + `postcss-preset-mantine` for UI.
-- The editor is Tiptap; shared node/mark extensions live in `packages/editor-ext` and are imported by **both the client and the server** (collaboration, import/export) — editor schema changes often need to be made in `editor-ext`, not just the client. Note `packages/mcp` does *not* depend on `editor-ext`; it carries its own mirrored copy of the schema, so keep the two in sync manually when the document schema changes.
+- The editor is Tiptap; shared node/mark extensions live in `packages/editor-ext` and are imported by **both the client and the server** (collaboration, import/export) — editor schema changes often need to be made in `editor-ext`, not just the client. The ProseMirror↔Markdown converter and its Docmost schema mirror now live in a SINGLE package, `@docmost/prosemirror-markdown` (#293), consumed by both `mcp` and `git-sync` — do NOT reintroduce a per-package copy. `editor-ext` is the upstream source of the Tiptap schema; `@docmost/prosemirror-markdown`'s `docmost-schema.ts` mirrors it, and a serializer-contract test (`packages/prosemirror-markdown/test/serializer-contract.test.ts`) guards the boundary (every schema node must have a converter case), so drift surfaces as a failing test rather than silent divergence.
 - API access goes through `apps/client/src/lib/api-client.ts` (axios). The `@` alias maps to `apps/client/src`.
 - Runtime config is injected at build time by `vite.config.ts` via `define` (`APP_URL`, `COLLAB_URL`, `APP_VERSION`, …) — these come from the root `.env`, not from `import.meta.env`.
 
@@ -293,7 +294,7 @@ Vite SPA. Code is organized by feature under `apps/client/src/features/*` (mirro
 - The version string shown in the UI comes from `APP_VERSION` (CI/Docker) or `git describe --tags --always` (local), resolved in `vite.config.ts` — not from `package.json`.
 - Server TS config is permissive (`noImplicitAny: false`, `strictNullChecks: false`, `no-explicit-any` lint disabled). Follow the existing relaxed style rather than tightening types broadly.
 - Dependency versions are heavily pinned via `pnpm.overrides` and `pnpm.patchedDependencies` (`scimmy`, `yjs`) in the root `package.json`. Don't bump pinned/patched deps casually; the patches and overrides exist for compatibility/security reasons.
-- **Adding/renaming/removing an MCP tool requires updating `SERVER_INSTRUCTIONS`** in `packages/mcp/src/index.ts` — the intent-routing guide MCP clients receive on initialize. This applies both to inline `server.registerTool(...)` calls in `index.ts` and to specs in `packages/mcp/src/tool-specs.ts`. Enforced by `packages/mcp/test/unit/server-instructions.test.mjs`, which fails when a registered tool is not mentioned in the guide (deliberate opt-outs go into its `EXCEPTIONS` list). Remember `packages/mcp/build/` is committed — rebuild after editing.
+- **Adding/renaming/removing an MCP tool requires updating `SERVER_INSTRUCTIONS`** in `packages/mcp/src/index.ts` — the intent-routing guide MCP clients receive on initialize. This applies both to inline `server.registerTool(...)` calls in `index.ts` and to specs in `packages/mcp/src/tool-specs.ts`. Enforced by `packages/mcp/test/unit/server-instructions.test.mjs`, which fails when a registered tool is not mentioned in the guide (deliberate opt-outs go into its `EXCEPTIONS` list). `packages/mcp/build/` is gitignored and rebuilt in CI/Docker via `pnpm build` (same convention as `git-sync`/`prosemirror-markdown`) — never commit it; rebuild locally after editing to run the tests.
 
 ## CI / release
 
diff --git a/Dockerfile b/Dockerfile
index e6daeb72..42f5a267 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -38,6 +38,14 @@ COPY --from=builder /app/packages/editor-ext/dist /app/packages/editor-ext/dist
 COPY --from=builder /app/packages/editor-ext/package.json /app/packages/editor-ext/package.json
 COPY --from=builder /app/packages/mcp/build /app/packages/mcp/build
 COPY --from=builder /app/packages/mcp/package.json /app/packages/mcp/package.json
+# mcp now depends on @docmost/prosemirror-markdown (workspace:*) and eager-imports
+# it at runtime (the in-app ai-chat DocmostClient loads build/index.js ->
+# lib/markdown-converter.js). Ship the built package + its manifest, or the prod
+# install resolves a broken workspace symlink and every ai-chat tool dies with
+# ERR_MODULE_NOT_FOUND (#293/#326 step 5). (git-sync has no runtime consumer yet;
+# revisit at step 6 when #119 lands.)
+COPY --from=builder /app/packages/prosemirror-markdown/build /app/packages/prosemirror-markdown/build
+COPY --from=builder /app/packages/prosemirror-markdown/package.json /app/packages/prosemirror-markdown/package.json
 
 # Copy root package files
 COPY --from=builder /app/package.json /app/package.json
diff --git a/apps/server/src/core/ai-chat/tools/ai-chat-tools.service.ts b/apps/server/src/core/ai-chat/tools/ai-chat-tools.service.ts
index 82f2ecb6..cc0c48fa 100644
--- a/apps/server/src/core/ai-chat/tools/ai-chat-tools.service.ts
+++ b/apps/server/src/core/ai-chat/tools/ai-chat-tools.service.ts
@@ -659,13 +659,21 @@ export class AiChatToolsService {
 
       listComments: tool({
         description:
-          'List ALL comments on a page in one call, including RESOLVED ' +
-          'threads — filter by resolvedAt when you need only open ones. ' +
-          'Content is returned as Markdown.',
+          'List comments on a page in one call. By DEFAULT only ACTIVE ' +
+          'threads are returned; resolved threads (a resolved top-level ' +
+          'comment and all its replies) are hidden and their count reported ' +
+          'as `resolvedThreadsHidden` so you can re-query with ' +
+          '`includeResolved: true` to see everything. Returns ' +
+          '`{ items, resolvedThreadsHidden }`. Content is returned as Markdown.',
         inputSchema: modelFriendlyInput({
           pageId: z.string().describe('The id of the page.'),
+          includeResolved: z
+            .boolean()
+            .optional()
+            .describe('default only active threads; true — include resolved'),
         }),
-        execute: async ({ pageId }) => await client.listComments(pageId),
+        execute: async ({ pageId, includeResolved }) =>
+          await client.listComments(pageId, includeResolved),
       }),
 
       getComment: tool({
diff --git a/apps/server/src/core/ai-chat/tools/docmost-client.loader.ts b/apps/server/src/core/ai-chat/tools/docmost-client.loader.ts
index 42bbd097..8e6ee0c2 100644
--- a/apps/server/src/core/ai-chat/tools/docmost-client.loader.ts
+++ b/apps/server/src/core/ai-chat/tools/docmost-client.loader.ts
@@ -61,7 +61,12 @@ export interface DocmostClientLike {
     opts?: { regex?: boolean; caseSensitive?: boolean; limit?: number },
   ): Promise<Record<string, unknown>>;
   getTable(pageId: string, tableRef: string): Promise<Record<string, unknown>>;
-  listComments(pageId: string): Promise<unknown[]>;
+  // Returns `{ items, resolvedThreadsHidden }`. By DEFAULT (includeResolved
+  // unset or false) resolved threads are hidden wholesale; pass true for all.
+  listComments(
+    pageId: string,
+    includeResolved?: boolean,
+  ): Promise<{ items: unknown[]; resolvedThreadsHidden: number }>;
   getComment(
     commentId: string,
   ): Promise<{ data: Record<string, unknown>; success: boolean }>;
diff --git a/packages/git-sync/package.json b/packages/git-sync/package.json
index 96765ffa..fe37b436 100644
--- a/packages/git-sync/package.json
+++ b/packages/git-sync/package.json
@@ -20,6 +20,7 @@
   },
   "license": "MIT",
   "dependencies": {
+    "@docmost/prosemirror-markdown": "workspace:*",
     "@tiptap/core": "3.20.4",
     "@tiptap/extension-highlight": "3.20.4",
     "@tiptap/extension-image": "3.20.4",
diff --git a/packages/git-sync/src/engine/pull.ts b/packages/git-sync/src/engine/pull.ts
index b541c67a..3d7868d5 100644
--- a/packages/git-sync/src/engine/pull.ts
+++ b/packages/git-sync/src/engine/pull.ts
@@ -31,7 +31,7 @@
  */
 import { dirname } from "node:path";
 import { sep } from "node:path";
-import { parsePageFile, serializePageFile } from "../lib/page-file.js";
+import { parsePageFile, serializePageFile } from "@docmost/prosemirror-markdown";
 import type { GitSyncClient } from "./client.types.js";
 import { buildVaultLayout, type PageNode } from "./layout.js";
 import {
diff --git a/packages/git-sync/src/engine/push.ts b/packages/git-sync/src/engine/push.ts
index 63d28530..903931be 100644
--- a/packages/git-sync/src/engine/push.ts
+++ b/packages/git-sync/src/engine/push.ts
@@ -26,8 +26,11 @@
  * the gitmost server drives the engine in-process (there is no standalone CLI
  * entry point).
  */
-import { type DocmostMdMeta } from "../lib/index.js";
-import { parsePageFile, serializePageFile } from "../lib/page-file.js";
+import {
+  type DocmostMdMeta,
+  parsePageFile,
+  serializePageFile,
+} from "@docmost/prosemirror-markdown";
 import type { GitSyncClient } from "./client.types.js";
 import type { DiffEntry } from "./git.js";
 import { VaultGit, DEFAULT_BRANCH } from "./git.js";
diff --git a/packages/git-sync/src/engine/stabilize.ts b/packages/git-sync/src/engine/stabilize.ts
index a075b634..ce1acdcf 100644
--- a/packages/git-sync/src/engine/stabilize.ts
+++ b/packages/git-sync/src/engine/stabilize.ts
@@ -17,7 +17,7 @@ import {
   markdownToProseMirror,
   serializeDocmostMarkdownBody,
   type DocmostMdMeta,
-} from "../lib/index.js";
+} from "@docmost/prosemirror-markdown";
 
 /**
  * Meta object as `exportPageBody` builds it (SPEC §4). Kept byte-for-byte
diff --git a/packages/git-sync/src/index.ts b/packages/git-sync/src/index.ts
index a52ca8d3..8c9e87eb 100644
--- a/packages/git-sync/src/index.ts
+++ b/packages/git-sync/src/index.ts
@@ -8,6 +8,10 @@
  */
 
 // Pure converter (markdown <-> ProseMirror, file envelope, canonicalization).
+// Re-exported from the standalone `@docmost/prosemirror-markdown` package,
+// which is the single source of truth for the converter core; git-sync keeps
+// only the engine (vault/git/orchestrator) and re-surfaces the converter for
+// in-process consumers of the git-sync barrel.
 export {
   serializeDocmostMarkdown,
   serializeDocmostMarkdownBody,
@@ -16,8 +20,8 @@ export {
   markdownToProseMirror,
   canonicalizeContent,
   docsCanonicallyEqual,
-} from "./lib/index.js";
-export type { DocmostMdMeta } from "./lib/index.js";
+} from "@docmost/prosemirror-markdown";
+export type { DocmostMdMeta } from "@docmost/prosemirror-markdown";
 
 // Pure engine (no IO): reconcile planner, vault layout, sanitize, stabilize,
 // loop-guard body hash.
@@ -123,4 +127,4 @@ export {
 } from "./engine/path-guard.js";
 export type { PathGuardIo, VaultPathUnsafeReason } from "./engine/path-guard.js";
 
-export { parsePageFile, serializePageFile } from "./lib/page-file.js";
+export { parsePageFile, serializePageFile } from "@docmost/prosemirror-markdown";
diff --git a/packages/git-sync/src/lib/markdown-converter.ts b/packages/git-sync/src/lib/markdown-converter.ts
deleted file mode 100644
index 013a54f3..00000000
--- a/packages/git-sync/src/lib/markdown-converter.ts
+++ /dev/null
@@ -1,1130 +0,0 @@
-import { encodeHtmlEmbedSource } from "./docmost-schema.js";
-
-/**
- * Hard cap on processNode recursion depth (see the depth guard below).
- *
- * Chosen well above any realistic document (the deepest legitimate nesting the
- * editor can produce is far shallower) yet far below the point where the
- * converter's own call stack overflows. The heaviest shape (deeply nested
- * lists) costs ~5 JS frames per level and the runtime stack holds ~10k frames,
- * so the measured overflow is around level ~650 (deeply nested lists); 400
- * leaves a comfortable margin while still rendering pathological-but-bounded
- * docs in full (the 200-level stress fixture reaches depth ~204).
- */
-const MAX_NODE_DEPTH = 400;
-
-/**
- * Convert ProseMirror/TipTap JSON content to Markdown
- * Supports all Docmost-specific node types and extensions
- */
-export function convertProseMirrorToMarkdown(content: any): string {
-  if (!content || !content.content) return "";
-
-  // Escape a value interpolated into an HTML double-quoted attribute value
-  // (textAlign, colors, image src, math `text`, all data-* attrs, etc.). In the
-  // ATTRIBUTE context only the quote that delimits the value and the ampersand
-  // that starts an entity are special, so we escape ONLY & " (and ' for safety
-  // when single-quoted delimiters are used). We deliberately do NOT escape < or
-  // >: the HTML re-parser (parse5/jsdom via @tiptap/html) does NOT decode
-  // &lt;/&gt; back inside attribute values, so escaping them would corrupt the
-  // stored data (e.g. a math node's LaTeX `a < b`) and ACCUMULATE escapes on
-  // every round-trip (`a < b` -> `a &lt; b` -> `a &amp;lt; b`). Escaping & "
-  // keeps the value inert against attribute-injection while staying idempotent.
-  // NOTE: escape ONLY & and " here. The value is always wrapped in double
-  // quotes, so " is the only delimiter; ' is NOT special in a double-quoted
-  // value, and parse5 does not decode &#39; back inside attribute values, so
-  // escaping ' would (like < >) corrupt the value and accumulate &amp; on every
-  // round-trip. Escaping & and " is idempotent (parse5 decodes them back).
-  const escapeAttr = (value: unknown): string =>
-    String(value)
-      .replace(/&/g, "&amp;")
-      .replace(/"/g, "&quot;");
-
-  // Escape a value placed as HTML element TEXT content (between tags), where
-  // <, >, and & are all significant. Used for text rendered inside raw-HTML
-  // blocks (table cells / columns) so stored characters cannot inject markup.
-  const escapeHtmlText = (value: unknown): string =>
-    String(value)
-      .replace(/&/g, "&amp;")
-      .replace(/</g, "&lt;")
-      .replace(/>/g, "&gt;");
-
-  // Percent-encode characters that would break out of a markdown URL target
-  // (...) — whitespace/newlines and parentheses — so a stored src stays a
-  // single inert token (used for image/video/youtube srcs).
-  const encodeMdUrl = (value: unknown): string =>
-    String(value || "")
-      .replace(/\s/g, (c: string) => (c === " " ? "%20" : encodeURIComponent(c)))
-      .replace(/\(/g, "%28")
-      .replace(/\)/g, "%29");
-
-  // Recursion depth guard. processNode is mutually recursive (directly and via
-  // processListItem/processTaskItem/blockToHtml), and a pathologically nested
-  // document (e.g. tens of thousands of nested blockquotes) would otherwise
-  // overflow the call stack and throw a RangeError, which would abort the sync
-  // and prevent the page from ever being written. We track the live nesting
-  // depth in a closure counter (the wrapper below) so we NEVER throw: past the
-  // limit we stop recursing and emit the node's own text (or nothing) instead.
-  // Normal documents never approach MAX_NODE_DEPTH, so their output is byte-
-  // identical. NOTE: the wrapper signature is (node) only — several callers use
-  // `.map(processNode)`, which would otherwise pass the array index as a second
-  // argument; the wrapper ignores extra arguments so that is harmless.
-  let nodeDepth = 0;
-
-  // A table cell whose content is NOT a single plain paragraph — a list, code
-  // block, blockquote, multiple paragraphs, etc. A GFM pipe cell can only hold
-  // inline content on one line, so such a cell must force the HTML <table> form
-  // or its structure is flattened/lost on round trip (review #8).
-  const cellIsMultiBlock = (cell: any): boolean => {
-    const blocks = cell.content || [];
-    if (blocks.length > 1) return true;
-    const only = blocks[0];
-    return only != null && only.type !== "paragraph";
-  };
-
-  // Render a whole table as raw HTML `<table>` (round-trips via the schema's
-  // table-family parseHTML). Used when a GFM pipe table would be wrong: merged
-  // cells (colspan/rowspan), multi-block cells (#8), OR the table sits inside a
-  // raw-HTML container like a column (marked does not parse markdown inside raw
-  // HTML, so a GFM pipe table there becomes literal "| a | b |" text — #7).
-  // `blockToHtml` is referenced lazily (defined below; only called at runtime).
-  const tableToHtml = (tableRows: any[]): string => {
-    const renderHtmlCell = (cell: any): string => {
-      const tag = cell.type === "tableHeader" ? "th" : "td";
-      const a = cell.attrs || {};
-      const cellParts: string[] = [];
-      if ((a.colspan ?? 1) > 1)
-        cellParts.push(`colspan="${escapeAttr(a.colspan)}"`);
-      if ((a.rowspan ?? 1) > 1)
-        cellParts.push(`rowspan="${escapeAttr(a.rowspan)}"`);
-      if (a.align) cellParts.push(`align="${escapeAttr(a.align)}"`);
-      const open = cellParts.length
-        ? `<${tag} ${cellParts.join(" ")}>`
-        : `<${tag}>`;
-      const inner = (cell.content || [])
-        .map((block: any) => blockToHtml(block))
-        .join("");
-      return `${open}${inner}</${tag}>`;
-    };
-    const htmlRows = tableRows
-      .map(
-        (row: any) =>
-          `<tr>${(row.content || []).map(renderHtmlCell).join("")}</tr>`,
-      )
-      .join("");
-    return `<table><tbody>${htmlRows}</tbody></table>`;
-  };
-
-  const processNode = (node: any): string => {
-    if (nodeDepth >= MAX_NODE_DEPTH) {
-      // Bail out of deeper recursion without throwing. A text node still has
-      // its own content worth keeping; a container at the limit collapses to
-      // "" (its already-too-deep subtree is dropped) rather than overflowing.
-      return typeof node?.text === "string" ? node.text : "";
-    }
-    nodeDepth++;
-    try {
-      return processNodeInner(node);
-    } finally {
-      nodeDepth--;
-    }
-  };
-
-  const processNodeInner = (node: any): string => {
-    const type = node.type;
-    const nodeContent = node.content || [];
-
-    switch (type) {
-      case "doc":
-        return nodeContent.map(processNode).join("\n\n");
-
-      case "paragraph":
-        const text = nodeContent.map(processNode).join("");
-        const align = node.attrs?.textAlign;
-        if (align && align !== "left") {
-          // Emit alignment as a styled `<p>` (review #10). The old
-          // `<div align="…">` had NO matching import parse rule — the div was
-          // unwrapped and alignment lost on every round trip. A styled `<p>`
-          // round-trips: the paragraph parse rule (tag:"p") matches and the
-          // textAlign global-attribute parseHTML (docmost-schema) reads the style.
-          return `<p style="text-align:${escapeAttr(align)}">${text}</p>`;
-        }
-        return text || "";
-
-      case "heading":
-        const level = node.attrs?.level || 1;
-        const headingText = nodeContent.map(processNode).join("");
-        const headingAlign = node.attrs?.textAlign;
-        if (headingAlign && headingAlign !== "left") {
-          // Emit alignment as a styled `<hN>` so it round-trips losslessly,
-          // symmetric to the paragraph case above (review F5/A1). The bare
-          // `## text` markdown form carries NO alignment, so an aligned heading
-          // would silently drop textAlign on export. A styled `<hN>` re-parses:
-          // the heading parse rule (tag:"h1".."h6") matches and the textAlign
-          // global-attribute parseHTML (docmost-schema) reads the style back,
-          // preserving BOTH level and textAlign. escapeAttr keeps the align
-          // value injection-safe, exactly like the paragraph arm.
-          return `<h${level} style="text-align:${escapeAttr(headingAlign)}">${headingText}</h${level}>`;
-        }
-        // No alignment (or the default "left"): keep the plain `## text`
-        // markdown form — HTML-ifying an unaligned heading would be needless
-        // churn, exactly as the paragraph case keeps plain text when unaligned.
-        return "#".repeat(level) + " " + headingText;
-
-      case "text":
-        let textContent = node.text || "";
-        // Apply marks (bold, italic, code, etc.)
-        if (node.marks) {
-          // The schema's `code` mark declares `excludes: "_"` — it excludes every
-          // other inline mark — so the editor can NEVER produce a text run that
-          // carries `code` together with another mark, and on import any
-          // co-occurring mark is always dropped (the run comes back as code-only).
-          // The lossless, byte-stable behavior is therefore: when a run has the
-          // `code` mark, emit ONLY the backtick code span and ignore every other
-          // mark, so md1 is already code-only and md2 === md1. Runs WITHOUT a code
-          // mark are rendered exactly as before.
-          const markTypes = node.marks.map((m: any) => m.type);
-          const hasCode = markTypes.includes("code");
-          if (hasCode) {
-            textContent = `\`${textContent}\``;
-            return textContent;
-          }
-          const codeCombined = false;
-          for (const mark of node.marks) {
-            switch (mark.type) {
-              case "bold":
-                textContent = codeCombined
-                  ? `<strong>${textContent}</strong>`
-                  : `**${textContent}**`;
-                break;
-              case "italic":
-                textContent = codeCombined
-                  ? `<em>${textContent}</em>`
-                  : `*${textContent}*`;
-                break;
-              case "code":
-                // When combined with another mark, wrap as <code> so the
-                // surrounding HTML marks can nest around it; otherwise use the
-                // plain backtick span.
-                textContent = codeCombined
-                  ? `<code>${textContent}</code>`
-                  : `\`${textContent}\``;
-                break;
-              case "link": {
-                const href = mark.attrs?.href || "";
-                const title = mark.attrs?.title;
-                if (codeCombined) {
-                  // Emit an HTML anchor so it can wrap the nested <code>.
-                  const safeHref = escapeAttr(href);
-                  if (title) {
-                    textContent = `<a href="${safeHref}" title="${escapeAttr(String(title))}">${textContent}</a>`;
-                  } else {
-                    textContent = `<a href="${safeHref}">${textContent}</a>`;
-                  }
-                } else if (title) {
-                  // Emit the optional markdown link title; escape an embedded
-                  // double-quote so it cannot terminate the title string early.
-                  const safeTitle = String(title).replace(/"/g, '\\"');
-                  textContent = `[${textContent}](${href} "${safeTitle}")`;
-                } else {
-                  textContent = `[${textContent}](${href})`;
-                }
-                break;
-              }
-              case "strike":
-                textContent = codeCombined
-                  ? `<s>${textContent}</s>`
-                  : `~~${textContent}~~`;
-                break;
-              case "underline":
-                textContent = `<u>${textContent}</u>`;
-                break;
-              case "subscript":
-                textContent = `<sub>${textContent}</sub>`;
-                break;
-              case "superscript":
-                textContent = `<sup>${textContent}</sup>`;
-                break;
-              case "highlight": {
-                // Preserve a null/empty color as a plain highlight (a bare
-                // <mark> with no background-color); only emit the style when a
-                // color is actually set, so a plain highlight is not forced to
-                // yellow on export.
-                const color = mark.attrs?.color;
-                textContent = color
-                  ? `<mark style="background-color: ${escapeAttr(color)}">${textContent}</mark>`
-                  : `<mark>${textContent}</mark>`;
-                break;
-              }
-              case "textStyle":
-                if (mark.attrs?.color) {
-                  textContent = `<span style="color: ${escapeAttr(mark.attrs.color)}">${textContent}</span>`;
-                }
-                break;
-              case "spoiler":
-                // Markdown has no native spoiler syntax, so emit the same raw
-                // inline HTML the editor-ext/MCP stack uses. The schema's Spoiler
-                // mark parses span[data-spoiler] back on import, so the mark
-                // survives the PM -> MD -> PM round-trip.
-                textContent = `<span data-spoiler="true">${textContent}</span>`;
-                break;
-              case "comment": {
-                // Emit the inline comment anchor so highlights round-trip. The
-                // schema's Comment mark parses span[data-comment-id] (attrs
-                // commentId/resolved).
-                const cid = mark.attrs?.commentId;
-                if (cid) {
-                  const resolvedAttr = mark.attrs?.resolved
-                    ? ` data-resolved="true"`
-                    : "";
-                  textContent = `<span data-comment-id="${escapeAttr(cid)}"${resolvedAttr}>${textContent}</span>`;
-                }
-                break;
-              }
-            }
-          }
-        }
-        return textContent;
-
-      case "codeBlock":
-        const language = node.attrs?.language || "";
-        // Strip ALL trailing newlines so the export is idempotent: marked
-        // re-adds exactly one trailing "\n" on import, so trimming only one
-        // here would let the text grow by "\n" on each round-trip. Removing
-        // every trailing newline makes repeated cycles stable.
-        const code = nodeContent
-          .map(processNode)
-          .join("")
-          .replace(/\n+$/, "");
-        // CommonMark: an inner ``` run inside the code would prematurely close
-        // a 3-backtick fence (corrupting the block on re-import). Use an outer
-        // fence one backtick longer than the longest backtick run in the code
-        // (minimum 3) so the inner fence is always content.
-        const longestBacktickRun = (code.match(/`+/g) || []).reduce(
-          (max: number, run: string) => Math.max(max, run.length),
-          0,
-        );
-        const fence = "`".repeat(Math.max(3, longestBacktickRun + 1));
-        return fence + language + "\n" + code + "\n" + fence;
-
-      case "bulletList":
-        return nodeContent
-          .map((item: any) => processListItem(item, "-"))
-          .join("\n");
-
-      case "orderedList":
-        return nodeContent
-          .map((item: any, index: number) =>
-            processListItem(item, `${index + 1}.`),
-          )
-          .join("\n");
-
-      case "taskList":
-        return nodeContent.map((item: any) => processTaskItem(item)).join("\n");
-
-      case "taskItem":
-        // Delegate to the same helper used by taskList so multi-block and
-        // nested task items render and indent consistently.
-        return processTaskItem(node);
-
-      case "listItem":
-        return nodeContent.map(processNode).join("\n");
-
-      case "blockquote":
-        // Prefix EVERY line of EVERY child with "> " and separate block-level
-        // children with a blank ">" line so code blocks / multi-paragraph
-        // quotes round-trip correctly.
-        return nodeContent
-          .map((n: any) =>
-            processNode(n)
-              .split("\n")
-              .map((line: string) => (line.length ? `> ${line}` : ">"))
-              .join("\n"),
-          )
-          .join("\n>\n");
-
-      case "horizontalRule":
-        return "---";
-
-      case "hardBreak":
-        // Two trailing spaces before the newline encode a markdown hard break;
-        // a bare "\n" would be reimported as a soft break and lost.
-        return "  \n";
-
-      case "image": {
-        const imgAttrs = node.attrs || {};
-        // A top-level image with layout/identity attrs beyond src/alt cannot be
-        // expressed by markdown `![](src)` — width/height/align/size/
-        // attachmentId/aspectRatio would be silently dropped on export and lost
-        // on re-import. Emit the SAME schema-matching <img> used inside columns
-        // (imageToHtml) so those attrs survive the round-trip. A bare image
-        // (only src/alt, optionally a title — which has no schema attr) keeps
-        // the lighter markdown form so existing image round-trip tests hold.
-        const hasLayoutAttrs =
-          imgAttrs.width != null ||
-          imgAttrs.height != null ||
-          imgAttrs.align ||
-          imgAttrs.size != null ||
-          imgAttrs.attachmentId ||
-          imgAttrs.aspectRatio != null ||
-          // A caption (issue #221) cannot be expressed by markdown `![](src)`,
-          // so route a captioned image through imageToHtml's raw <img> form
-          // (data-caption) — the same lossless form used for the other
-          // Docmost-specific image attrs.
-          imgAttrs.caption;
-        if (hasLayoutAttrs) {
-          return imageToHtml(node);
-        }
-        const imgAlt = imgAttrs.alt || "";
-        // Neutralize characters that could break out of the markdown image
-        // URL: spaces/newlines and parentheses would terminate the (...) target
-        // and let a stored src inject following markdown/HTML. Percent-encode
-        // them so the URL stays a single inert token.
-        const imgSrc = encodeMdUrl(imgAttrs.src);
-        // A bare image (only src/alt, optionally a title) has no caption, so the
-        // lighter markdown form is lossless here; captioned images took the
-        // imageToHtml branch above.
-        return `![${imgAlt}](${imgSrc})`;
-      }
-
-      case "video": {
-        // Emit the schema-matching <video> element so generateJSON rebuilds the
-        // node with its attrs intact. The schema's parseHTML reads src/aria-label
-        // from the standard attributes and the remaining attrs from data-*.
-        const attrs = node.attrs || {};
-        const parts: string[] = [`src="${escapeAttr(attrs.src ?? "")}"`];
-        if (attrs.alt) parts.push(`aria-label="${escapeAttr(attrs.alt)}"`);
-        if (attrs.attachmentId)
-          parts.push(
-            `data-attachment-id="${escapeAttr(attrs.attachmentId)}"`,
-          );
-        if (attrs.width != null)
-          parts.push(`width="${escapeAttr(attrs.width)}"`);
-        if (attrs.height != null)
-          parts.push(`height="${escapeAttr(attrs.height)}"`);
-        if (attrs.size != null)
-          parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-        if (attrs.align)
-          parts.push(`data-align="${escapeAttr(attrs.align)}"`);
-        if (attrs.aspectRatio != null)
-          parts.push(`data-aspect-ratio="${escapeAttr(attrs.aspectRatio)}"`);
-        // Wrap in a block <div> so marked treats it as a block (a bare <video>
-        // is inline-level HTML and marked wraps it in <p>, leaving a spurious
-        // empty paragraph beside the hoisted block atom). The wrapper has no
-        // data-type, so the schema parser ignores it and just hoists the video.
-        return `<div><video ${parts.join(" ")}></video></div>`;
-      }
-
-      case "youtube": {
-        // Emit the schema-matching div[data-type="youtube"]; the schema reads
-        // src from data-src and width/height/align from data-* attributes.
-        const attrs = node.attrs || {};
-        const parts: string[] = [
-          `data-type="youtube"`,
-          `data-src="${escapeAttr(attrs.src ?? "")}"`,
-        ];
-        if (attrs.width != null)
-          parts.push(`data-width="${escapeAttr(attrs.width)}"`);
-        if (attrs.height != null)
-          parts.push(`data-height="${escapeAttr(attrs.height)}"`);
-        if (attrs.align)
-          parts.push(`data-align="${escapeAttr(attrs.align)}"`);
-        return `<div ${parts.join(" ")}></div>`;
-      }
-
-      case "table": {
-        // A GFM pipe table cannot represent merged cells. If ANY cell carries
-        // colspan>1 or rowspan>1, a pipe table would corrupt the grid on
-        // re-import, so emit the WHOLE table as raw HTML <table> instead: the
-        // schema's table family parseHTML (tag table/tr/td/th, with colspan/
-        // rowspan read from the same-named HTML attrs and align via parseHTML)
-        // round-trips it faithfully. Otherwise keep the lighter GFM pipe table.
-        const tableRows: any[] = nodeContent;
-        if (tableRows.length === 0) return "";
-        const hasSpan = tableRows.some((row: any) =>
-          (row.content || []).some(
-            (cell: any) =>
-              (cell.attrs?.colspan ?? 1) > 1 || (cell.attrs?.rowspan ?? 1) > 1,
-          ),
-        );
-        // A GFM pipe table also cannot hold a cell with block content (a list,
-        // code block, paragraphs) — it would be flattened to one line and lost
-        // (review #8). Force the HTML form for those too.
-        const hasMultiBlockCell = tableRows.some((row: any) =>
-          (row.content || []).some((cell: any) => cellIsMultiBlock(cell)),
-        );
-
-        if (hasSpan || hasMultiBlockCell) {
-          return tableToHtml(tableRows);
-        }
-
-        // No merged cells: emit a GFM table (header row + separator) so the
-        // markdown can be parsed back into a table on re-import.
-        const rows = tableRows.map(processNode);
-        const headerCells = tableRows[0]?.content || [];
-        const columns = headerCells.length || 1;
-        // Derive alignment markers (:--, :-:, --:) from each header cell.
-        const markers = Array.from({ length: columns }, (_, i) => {
-          const align = headerCells[i]?.attrs?.align;
-          switch (align) {
-            case "left":
-              return ":--";
-            case "center":
-              return ":-:";
-            case "right":
-              return "--:";
-            default:
-              return "---";
-          }
-        });
-        const separator = "| " + markers.join(" | ") + " |";
-        return [rows[0], separator, ...rows.slice(1)].join("\n");
-      }
-
-      case "tableRow":
-        return "| " + nodeContent.map(processNode).join(" | ") + " |";
-
-      case "tableCell":
-      case "tableHeader": {
-        // Join multiple block children with a space (not "") so adjacent blocks
-        // like a paragraph followed by a list don't collide into "line1- a".
-        // Then collapse newlines and escape pipes so a cell containing "|" or a
-        // line break cannot corrupt the surrounding GFM row.
-        return nodeContent
-          .map(processNode)
-          .join(" ")
-          .replace(/\r?\n/g, " ")
-          .replace(/\|/g, "\\|");
-      }
-
-      case "callout": {
-        // Obsidian-native callout: `> [!type]` opener + a blockquote (`>`-prefixed)
-        // body, so it renders as a callout in Obsidian. The importer parses both
-        // this and the legacy `:::type` fence (existing vaults). Each body line is
-        // blockquote-prefixed; a blank line becomes a bare `>` so the callout is
-        // not split.
-        const calloutType = (node.attrs?.type || "info").toLowerCase();
-        const calloutBody = nodeContent
-          .map(processNode)
-          .join("\n")
-          .split("\n")
-          .map((l: string) => (l.length ? `> ${l}` : ">"))
-          .join("\n");
-        return `> [!${calloutType}]\n${calloutBody}`;
-      }
-
-      case "details": {
-        // The `open` (collapsed/expanded) state lives on the details node, NOT on
-        // the summary, so emit the <details> wrapper HERE carrying it — otherwise
-        // the open state is dropped on a round trip. The schema's details node
-        // parses `open` back from the attribute.
-        const open = node.attrs?.open ? " open" : "";
-        return `<details${open}>\n${nodeContent.map(processNode).join("")}</details>`;
-      }
-
-      case "detailsSummary":
-        return `<summary>${nodeContent.map(processNode).join("")}</summary>\n\n`;
-
-      case "detailsContent":
-        return `${nodeContent.map(processNode).join("\n")}\n`;
-
-      case "mathInline": {
-        // The schema's `text` attribute has no parseHTML, so TipTap's default
-        // parser reads it from the `text` HTML attribute (NOT the element's text
-        // content). Emit span[data-type="mathInline"] carrying the LaTeX in a
-        // `text="..."` attribute so it round-trips. marked cannot parse $...$
-        // back, so the previous form was lossy.
-        const inlineMath = node.attrs?.text || "";
-        return `<span data-type="mathInline" data-katex="true" text="${escapeAttr(inlineMath)}"></span>`;
-      }
-
-      case "mathBlock": {
-        // Same as mathInline: the LaTeX must ride in the `text` HTML attribute
-        // for the schema's default parser to recover it.
-        const blockMath = node.attrs?.text || "";
-        return `<div data-type="mathBlock" data-katex="true" text="${escapeAttr(blockMath)}"></div>`;
-      }
-
-      case "mention": {
-        // Emit span[data-type="mention"] with the schema's data-* attributes so
-        // generateJSON rebuilds the mention node instead of leaving "@label"
-        // plain text that cannot re-parse.
-        const attrs = node.attrs || {};
-        const parts: string[] = [`data-type="mention"`];
-        if (attrs.id) parts.push(`data-id="${escapeAttr(attrs.id)}"`);
-        if (attrs.label)
-          parts.push(`data-label="${escapeAttr(attrs.label)}"`);
-        if (attrs.entityType)
-          parts.push(`data-entity-type="${escapeAttr(attrs.entityType)}"`);
-        if (attrs.entityId)
-          parts.push(`data-entity-id="${escapeAttr(attrs.entityId)}"`);
-        if (attrs.slugId)
-          parts.push(`data-slug-id="${escapeAttr(attrs.slugId)}"`);
-        if (attrs.creatorId)
-          parts.push(`data-creator-id="${escapeAttr(attrs.creatorId)}"`);
-        if (attrs.anchorId)
-          parts.push(`data-anchor-id="${escapeAttr(attrs.anchorId)}"`);
-        // Keep the label as visible text content too; the schema reads attrs
-        // from data-*, so the inner text is purely cosmetic and harmless.
-        const mentionLabel = attrs.label || attrs.id || "";
-        // The label is visible element TEXT content here (the data-* attrs above
-        // carry the real values), so escape it for the text context, not attrs.
-        return `<span ${parts.join(" ")}>@${escapeHtmlText(mentionLabel)}</span>`;
-      }
-
-      case "attachment": {
-        // BUG FIX: the old code read node.attrs.fileName / node.attrs.src, but
-        // the schema stores name/url (plus mime/size/attachmentId). Emit the
-        // schema-matching div[data-type="attachment"] with data-attachment-*
-        // attrs so the node round-trips instead of degrading to a markdown link.
-        const attrs = node.attrs || {};
-        const parts: string[] = [
-          `data-type="attachment"`,
-          `data-attachment-url="${escapeAttr(attrs.url ?? "")}"`,
-        ];
-        if (attrs.name)
-          parts.push(`data-attachment-name="${escapeAttr(attrs.name)}"`);
-        if (attrs.mime)
-          parts.push(`data-attachment-mime="${escapeAttr(attrs.mime)}"`);
-        if (attrs.size != null)
-          parts.push(`data-attachment-size="${escapeAttr(attrs.size)}"`);
-        if (attrs.attachmentId)
-          parts.push(
-            `data-attachment-id="${escapeAttr(attrs.attachmentId)}"`,
-          );
-        return `<div ${parts.join(" ")}></div>`;
-      }
-
-      case "drawio":
-      case "excalidraw": {
-        // Emit the schema-matching div[data-type=...] carrying the diagram's
-        // attrs as data-* (the schema's diagramAttributes reads src/title/alt/
-        // width/height/size/aspectRatio/align/attachmentId from data-*), so the
-        // diagram round-trips instead of degrading to a lossy placeholder.
-        const attrs = node.attrs || {};
-        const parts: string[] = [
-          `data-type="${type}"`,
-          `data-src="${escapeAttr(attrs.src ?? "")}"`,
-        ];
-        if (attrs.title != null)
-          parts.push(`data-title="${escapeAttr(attrs.title)}"`);
-        if (attrs.alt != null) parts.push(`data-alt="${escapeAttr(attrs.alt)}"`);
-        if (attrs.width != null)
-          parts.push(`data-width="${escapeAttr(attrs.width)}"`);
-        if (attrs.height != null)
-          parts.push(`data-height="${escapeAttr(attrs.height)}"`);
-        if (attrs.size != null)
-          parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-        if (attrs.aspectRatio != null)
-          parts.push(`data-aspect-ratio="${escapeAttr(attrs.aspectRatio)}"`);
-        if (attrs.align)
-          parts.push(`data-align="${escapeAttr(attrs.align)}"`);
-        if (attrs.attachmentId)
-          parts.push(
-            `data-attachment-id="${escapeAttr(attrs.attachmentId)}"`,
-          );
-        return `<div ${parts.join(" ")}></div>`;
-      }
-
-      case "embed": {
-        // Emit the schema-matching div[data-type="embed"]; the schema reads
-        // src/provider/align/width/height from data-* attributes so the node
-        // (and its provider iframe info) survives the round-trip.
-        const attrs = node.attrs || {};
-        const parts: string[] = [
-          `data-type="embed"`,
-          `data-src="${escapeAttr(attrs.src ?? "")}"`,
-          `data-provider="${escapeAttr(attrs.provider ?? "")}"`,
-        ];
-        if (attrs.align)
-          parts.push(`data-align="${escapeAttr(attrs.align)}"`);
-        if (attrs.width != null)
-          parts.push(`data-width="${escapeAttr(attrs.width)}"`);
-        if (attrs.height != null)
-          parts.push(`data-height="${escapeAttr(attrs.height)}"`);
-        return `<div ${parts.join(" ")}></div>`;
-      }
-
-      case "audio": {
-        // Emit the schema-matching <audio> element (was emitting nothing). The
-        // schema reads src from src and attachmentId/size from data-*.
-        const attrs = node.attrs || {};
-        const parts: string[] = [`src="${escapeAttr(attrs.src ?? "")}"`];
-        if (attrs.attachmentId)
-          parts.push(
-            `data-attachment-id="${escapeAttr(attrs.attachmentId)}"`,
-          );
-        if (attrs.size != null)
-          parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-        // Wrap in a block <div> for the same reason as video: a bare <audio> is
-        // inline-level HTML that marked would wrap in <p>.
-        return `<div><audio ${parts.join(" ")}></audio></div>`;
-      }
-
-      case "pdf": {
-        // Emit the schema-matching div[data-type="pdf"] (was emitting nothing).
-        // The schema reads src/width/height from standard attrs and name/
-        // attachmentId/size from data-*.
-        const attrs = node.attrs || {};
-        const parts: string[] = [
-          `data-type="pdf"`,
-          `src="${escapeAttr(attrs.src ?? "")}"`,
-        ];
-        if (attrs.name) parts.push(`data-name="${escapeAttr(attrs.name)}"`);
-        if (attrs.attachmentId)
-          parts.push(
-            `data-attachment-id="${escapeAttr(attrs.attachmentId)}"`,
-          );
-        if (attrs.size != null)
-          parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-        if (attrs.width != null)
-          parts.push(`width="${escapeAttr(attrs.width)}"`);
-        if (attrs.height != null)
-          parts.push(`height="${escapeAttr(attrs.height)}"`);
-        return `<div ${parts.join(" ")}></div>`;
-      }
-
-      case "columns": {
-        // Emit the schema-matching div[data-type="columns"] wrapper so the
-        // multi-column layout survives. Without a case the children were
-        // concatenated with no separator and the text merged. The schema reads
-        // layout from data-layout and widthMode from data-width-mode. The whole
-        // block is raw HTML, so render children via blockToHtml (NOT markdown,
-        // which marked would not re-parse inside a raw HTML block).
-        const attrs = node.attrs || {};
-        const parts: string[] = [`data-type="columns"`];
-        if (attrs.layout)
-          parts.push(`data-layout="${escapeAttr(attrs.layout)}"`);
-        if (attrs.widthMode && attrs.widthMode !== "normal")
-          parts.push(`data-width-mode="${escapeAttr(attrs.widthMode)}"`);
-        const inner = nodeContent.map((n: any) => blockToHtml(n)).join("");
-        return `<div ${parts.join(" ")}>${inner}</div>`;
-      }
-
-      case "column": {
-        // Emit the schema-matching div[data-type="column"]; the schema reads the
-        // column width from data-width. Children are rendered as HTML so their
-        // formatting survives inside this raw HTML block.
-        const attrs = node.attrs || {};
-        const parts: string[] = [`data-type="column"`];
-        if (attrs.width)
-          parts.push(`data-width="${escapeAttr(attrs.width)}"`);
-        const inner = nodeContent.map((n: any) => blockToHtml(n)).join("");
-        return `<div ${parts.join(" ")}>${inner}</div>`;
-      }
-
-      case "pageBreak":
-        // Emit the schema-matching div[data-type="pageBreak"] so marked passes
-        // it through as a block and generateJSON rebuilds the pageBreak atom.
-        // Without this case the node fell through to `default` and rendered ""
-        // (the divider silently disappeared and could not round-trip).
-        return `<div data-type="pageBreak"></div>`;
-
-      case "subpages": {
-        // Emit the schema-matching div[data-type="subpages"] so marked passes it
-        // through as a block and generateJSON rebuilds the subpages atom. The old
-        // `{{SUBPAGES}}` literal had no parseHTML inverse, so on import it stayed
-        // as plain text — the embed rendered as the literal "{{SUBPAGES}}" on the
-        // page after a round-trip (red-team: subpages round-trip data loss).
-        // `data-recursive` carries the recursive toggle so it round-trips too.
-        const recursive = node.attrs?.recursive ? ` data-recursive="true"` : "";
-        return `<div data-type="subpages"${recursive}></div>`;
-      }
-
-      case "status": {
-        // Inline status pill. The schema reads the label from the element's
-        // TEXT content and the color from data-color, so emit both; without a
-        // case this inline atom fell through to `default` and collapsed to "".
-        const attrs = node.attrs || {};
-        const statusColor = attrs.color || "gray";
-        return `<span data-type="status" data-color="${escapeAttr(statusColor)}">${escapeHtmlText(attrs.text ?? "")}</span>`;
-      }
-
-      case "htmlEmbed": {
-        // Block atom; the schema reads the raw source from a base64-encoded
-        // data-source attribute (and an optional fixed height from data-height).
-        // Encode with the shared helper so it decodes symmetrically on import.
-        const attrs = node.attrs || {};
-        const parts: string[] = [
-          `data-type="htmlEmbed"`,
-          `data-source="${escapeAttr(encodeHtmlEmbedSource(attrs.source ?? ""))}"`,
-        ];
-        if (attrs.height != null)
-          parts.push(`data-height="${escapeAttr(attrs.height)}"`);
-        return `<div ${parts.join(" ")}></div>`;
-      }
-
-      case "footnoteReference": {
-        // Inline atom marker. The schema reads its id from data-id on a
-        // sup[data-footnote-ref]; the visible number is derived, not stored.
-        const attrs = node.attrs || {};
-        const idAttr = attrs.id ? ` data-id="${escapeAttr(attrs.id)}"` : "";
-        return `<sup data-footnote-ref${idAttr}></sup>`;
-      }
-
-      case "footnotesList": {
-        // Bottom container of footnote definitions (section[data-footnotes]).
-        const inner = nodeContent.map((n: any) => blockToHtml(n)).join("");
-        return `<section data-footnotes>${inner}</section>`;
-      }
-
-      case "footnoteDefinition": {
-        // One footnote note keyed by id (div[data-footnote-def]).
-        const attrs = node.attrs || {};
-        const idAttr = attrs.id ? ` data-id="${escapeAttr(attrs.id)}"` : "";
-        const inner = nodeContent.map((n: any) => blockToHtml(n)).join("");
-        return `<div data-footnote-def${idAttr}>${inner}</div>`;
-      }
-
-      case "pageEmbed": {
-        // Whole-page live embed; the schema reads data-source-page-id.
-        const attrs = node.attrs || {};
-        const parts: string[] = [`data-type="pageEmbed"`];
-        if (attrs.sourcePageId)
-          parts.push(`data-source-page-id="${escapeAttr(attrs.sourcePageId)}"`);
-        return `<div ${parts.join(" ")}></div>`;
-      }
-
-      case "transclusionReference": {
-        // Live reference to a transcluded block/page. Block atom; the schema
-        // reads data-source-page-id and data-transclusion-id.
-        const attrs = node.attrs || {};
-        const parts: string[] = [`data-type="transclusionReference"`];
-        if (attrs.sourcePageId)
-          parts.push(`data-source-page-id="${escapeAttr(attrs.sourcePageId)}"`);
-        if (attrs.transclusionId)
-          parts.push(
-            `data-transclusion-id="${escapeAttr(attrs.transclusionId)}"`,
-          );
-        return `<div ${parts.join(" ")}></div>`;
-      }
-
-      case "transclusionSource": {
-        // Sync-source container; the schema reads data-id and re-parses its
-        // block children, so render them as schema-matching HTML.
-        const attrs = node.attrs || {};
-        const idAttr = attrs.id ? ` data-id="${escapeAttr(attrs.id)}"` : "";
-        const inner = nodeContent.map((n: any) => blockToHtml(n)).join("");
-        return `<div data-type="transclusionSource"${idAttr}>${inner}</div>`;
-      }
-
-      default:
-        // Fallback: process children
-        return nodeContent.map(processNode).join("");
-    }
-  };
-
-  // Render inline content (text runs + their marks) to HTML. Used by the raw
-  // HTML fallbacks (spanned tables, columns) where marked will NOT re-parse
-  // markdown, so backtick/asterisk/bracket syntax would otherwise leak as
-  // literal characters. Each mark is mirrored to the HTML the schema's parseHTML
-  // accepts so it re-imports as the matching ProseMirror mark.
-  const inlineToHtml = (inlineNodes: any[]): string => {
-    // Marks that translate one-to-one into a bare HTML element.
-    const plainTagByMark = new Map<string, string>([
-      ["bold", "strong"],
-      ["italic", "em"],
-      ["code", "code"],
-      ["strike", "s"],
-      ["underline", "u"],
-      ["subscript", "sub"],
-      ["superscript", "sup"],
-    ]);
-
-    // Wrap already-escaped HTML in the element mirroring a single mark. A mark
-    // with no mapping here, a textStyle mark without a color, or a comment mark
-    // without a commentId leaves the HTML unchanged.
-    const wrapWithMark = (html: string, mark: any): string => {
-      const plainTag = plainTagByMark.get(mark.type);
-      if (plainTag !== undefined) {
-        return `<${plainTag}>${html}</${plainTag}>`;
-      }
-      if (mark.type === "link") {
-        return `<a href="${escapeAttr(mark.attrs?.href || "")}">${html}</a>`;
-      }
-      if (mark.type === "highlight") {
-        if (mark.attrs?.color) {
-          return `<mark style="background-color: ${escapeAttr(mark.attrs.color)}">${html}</mark>`;
-        }
-        return `<mark>${html}</mark>`;
-      }
-      if (mark.type === "textStyle" && mark.attrs?.color) {
-        return `<span style="color: ${escapeAttr(mark.attrs.color)}">${html}</span>`;
-      }
-      if (mark.type === "comment" && mark.attrs?.commentId) {
-        // Inline comment anchor; the resolved flag is only emitted when set.
-        const resolvedAttr = mark.attrs?.resolved ? ` data-resolved="true"` : "";
-        return `<span data-comment-id="${escapeAttr(mark.attrs.commentId)}"${resolvedAttr}>${html}</span>`;
-      }
-      return html;
-    };
-
-    // Render one inline node: hard breaks become <br>, non-text inline nodes
-    // are delegated to processNode, and text runs are escaped and then wrapped
-    // by each of their marks in array order (first mark innermost).
-    const renderInline = (inline: any): string => {
-      if (inline.type === "hardBreak") return "<br>";
-      if (inline.type !== "text") return processNode(inline);
-      let html = escapeHtmlText(inline.text || "");
-      for (const mark of inline.marks || []) {
-        html = wrapWithMark(html, mark);
-      }
-      return html;
-    };
-
-    return (inlineNodes || [])
-      .map((inline: any) => renderInline(inline))
-      .join("");
-  };
-
-  // Emit the schema-matching <img> for an image node. Shared so the image is
-  // emitted as real HTML wherever a raw-HTML container needs it (inside a column
-  // or a spanned table cell), where markdown `![](...)` would NOT be re-parsed
-  // and would survive as literal text. The Image extension reads src/alt from
-  // the standard attributes; the Docmost extra attrs (width/height/align/size/
-  // attachmentId/aspectRatio) are global attributes read from same-named DOM
-  // attributes, so emit them by name.
-  const imageToHtml = (node: any): string => {
-    const imgAttrs = node.attrs || {};
-    const rendered: string[] = [];
-    // Append one name="value" pair, escaping the value for attribute context.
-    const emit = (name: string, value: any): void => {
-      rendered.push(`${name}="${escapeAttr(value)}"`);
-    };
-
-    // src is always present (empty string when missing). String-like attrs are
-    // emitted only when truthy; numeric-like attrs whenever they are not
-    // null/undefined, so a 0 value is still written.
-    emit("src", imgAttrs.src ?? "");
-    if (imgAttrs.alt) emit("alt", imgAttrs.alt);
-    if (imgAttrs.title) emit("title", imgAttrs.title);
-    if (imgAttrs.width != null) emit("width", imgAttrs.width);
-    if (imgAttrs.height != null) emit("height", imgAttrs.height);
-    if (imgAttrs.align) emit("align", imgAttrs.align);
-    if (imgAttrs.size != null) emit("data-size", imgAttrs.size);
-    if (imgAttrs.attachmentId) {
-      emit("data-attachment-id", imgAttrs.attachmentId);
-    }
-    if (imgAttrs.aspectRatio != null) {
-      emit("data-aspect-ratio", imgAttrs.aspectRatio);
-    }
-    // Plain-text caption (issue #221): markdown image syntax cannot carry it,
-    // so it is written as data-caption.
-    if (imgAttrs.caption) emit("data-caption", imgAttrs.caption);
-
-    return `<img ${rendered.join(" ")}>`;
-  };
-
-  // Emit the schema-matching div[data-type="callout"] for a callout node. The
-  // schema reads the banner type from data-callout-type. Children are rendered
-  // as HTML so they survive inside a raw-HTML container.
-  const calloutToHtml = (node: any): string => {
-    // A missing type falls back to "info"; the value is lower-cased before it
-    // is written to data-callout-type.
-    const bannerType = (node.attrs?.type || "info").toLowerCase();
-    const bodyBlocks: any[] = node.content || [];
-    const bodyHtml = bodyBlocks
-      .map((child: any) => blockToHtml(child))
-      .join("");
-    return `<div data-type="callout" data-callout-type="${escapeAttr(bannerType)}">${bodyHtml}</div>`;
-  };
-
-  // Emit a schema-matching <details> tree. The schema parses <details>,
-  // summary[data-type="detailsSummary"], and div[data-type="detailsContent"].
-  // The `open` (collapsed/expanded) state lives on the details node and the
-  // schema parses it back from the attribute, so emit it here too — mirroring
-  // the top-level `details` case — or a NESTED details (inside columns/cells)
-  // would silently drop `open:true` every round trip.
-  const detailsToHtml = (node: any): string => {
-    const childBlocks: any[] = node.content || [];
-    const bodyHtml = childBlocks
-      .map((child: any) => blockToHtml(child))
-      .join("");
-    // The bare `open` attribute is emitted only when attrs.open is truthy.
-    if (node.attrs?.open) {
-      return `<details open>${bodyHtml}</details>`;
-    }
-    return `<details>${bodyHtml}</details>`;
-  };
-  const detailsSummaryToHtml = (node: any): string => {
-    // The summary holds inline content, so it is rendered via inlineToHtml.
-    const labelHtml = inlineToHtml(node.content || []);
-    return `<summary data-type="detailsSummary">${labelHtml}</summary>`;
-  };
-  const detailsContentToHtml = (node: any): string => {
-    // The content wrapper holds block children, each rendered as HTML.
-    const childBlocks: any[] = node.content || [];
-    const bodyHtml = childBlocks
-      .map((child: any) => blockToHtml(child))
-      .join("");
-    return `<div data-type="detailsContent">${bodyHtml}</div>`;
-  };
-
-  // Emit the schema-matching taskList/taskItem HTML. bridgeTaskLists (in
-  // collaboration.ts) recognizes ul[data-type="taskList"] with
-  // li[data-type="taskItem"][data-checked]; emitting that directly here keeps
-  // task lists inside columns/cells from degrading to literal "- [ ]" text.
-  const taskListToHtml = (node: any): string => {
-    // Render one task item; data-checked is always the literal "true" or
-    // "false", and the item's block children are rendered as HTML.
-    const renderItem = (item: any): string => {
-      const state = item.attrs?.checked ? "true" : "false";
-      const body = blockChildrenToHtml(item);
-      return `<li data-type="taskItem" data-checked="${state}">${body}</li>`;
-    };
-    const listBody = (node.content || [])
-      .map((item: any) => renderItem(item))
-      .join("");
-    return `<ul data-type="taskList">${listBody}</ul>`;
-  };
-
-  // Render a block node to HTML for the raw-HTML containers (spanned tables,
-  // columns). marked does NOT re-parse markdown inside a raw-HTML block, so
-  // EVERY block type that can appear inside a column or a spanned cell must be
-  // emitted as schema-matching HTML here — never as markdown, or it would land
-  // as literal text on re-import. Nodes whose processNode case already produces
-  // schema-matching HTML (math/media/embed/attachment/nested columns/spanned
-  // table) are delegated to processNode; the markdown-emitting cases
-  // (image/blockquote/callout/details/hr/taskList) get explicit HTML here.
-  const blockToHtml = (block: any): string => {
-    // Render one block node as HTML for use inside a raw-HTML container.
-    // Returns an HTML string; never emits markdown syntax for the cases handled
-    // here (delegated cases rely on processNode emitting HTML for those types).
-    const children = block.content || [];
-    // Node types that are inline content. Used by the fallback branch to tell
-    // a textblock (all-inline children) apart from a block container.
-    const inlineNodeTypes = new Set<string>([
-      "text",
-      "hardBreak",
-      "mention",
-      "mathInline",
-      "status",
-      "footnoteReference",
-    ]);
-    switch (block.type) {
-      case "paragraph": {
-        // Carry textAlign here too (symmetric with the processNode paragraph
-        // case): a paragraph nested inside an HTML container (column/table/
-        // callout) would otherwise drop its alignment on the round trip.
-        const pAlign = block.attrs?.textAlign;
-        const pStyle =
-          pAlign && pAlign !== "left"
-            ? ` style="text-align:${escapeAttr(pAlign)}"`
-            : "";
-        return `<p${pStyle}>${inlineToHtml(children)}</p>`;
-      }
-      case "heading": {
-        // Same for a heading nested in an HTML container: emit the alignment as
-        // an inline style (symmetric with the processNode heading case) so it is
-        // not silently dropped. Clamp the level to a valid HTML heading tag.
-        const level = Math.min(6, Math.max(1, block.attrs?.level || 1));
-        const hAlign = block.attrs?.textAlign;
-        const hStyle =
-          hAlign && hAlign !== "left"
-            ? ` style="text-align:${escapeAttr(hAlign)}"`
-            : "";
-        return `<h${level}${hStyle}>${inlineToHtml(children)}</h${level}>`;
-      }
-      case "bulletList":
-        return `<ul>${children
-          .map((li: any) => `<li>${blockChildrenToHtml(li)}</li>`)
-          .join("")}</ul>`;
-      case "orderedList":
-        return `<ol>${children
-          .map((li: any) => `<li>${blockChildrenToHtml(li)}</li>`)
-          .join("")}</ol>`;
-      case "codeBlock": {
-        const lang = block.attrs?.language || "";
-        // The code itself is element TEXT content (between <code> tags), so it
-        // must escape < > & — NOT the attribute escaper. The language rides in
-        // a class ATTRIBUTE, so it uses escapeAttr.
-        const code = escapeHtmlText(
-          children
-            .map(processNode)
-            .join("")
-            .replace(/\n+$/, ""),
-        );
-        const cls = lang ? ` class="language-${escapeAttr(lang)}"` : "";
-        return `<pre><code${cls}>${code}</code></pre>`;
-      }
-      case "image":
-        return imageToHtml(block);
-      case "blockquote":
-        return `<blockquote>${children.map(blockToHtml).join("")}</blockquote>`;
-      case "horizontalRule":
-        return "<hr>";
-      case "callout":
-        return calloutToHtml(block);
-      case "details":
-        return detailsToHtml(block);
-      case "detailsSummary":
-        return detailsSummaryToHtml(block);
-      case "detailsContent":
-        return detailsContentToHtml(block);
-      case "taskList":
-        return taskListToHtml(block);
-      case "taskItem":
-        // A bare taskItem (outside a taskList) still needs a wrapping list so
-        // the schema parses it; wrap it in a single-item taskList.
-        return taskListToHtml({ content: [block] });
-      // A table nested in a raw-HTML block (e.g. inside a column) MUST be the
-      // HTML <table> form — a GFM pipe table here would not be re-parsed by
-      // marked and would round-trip as literal "| a | b |" text (review #7).
-      case "table":
-        return tableToHtml(block.content || []);
-      // columns/column, math, media, embed, attachment, mention, etc. already
-      // emit schema-matching HTML from processNode.
-      case "columns":
-      case "column":
-      case "mathBlock":
-      case "video":
-      case "audio":
-      case "pdf":
-      case "youtube":
-      case "embed":
-      case "attachment":
-      case "drawio":
-      case "excalidraw":
-      case "htmlEmbed":
-      case "footnotesList":
-      case "footnoteDefinition":
-      case "pageEmbed":
-      case "transclusionSource":
-      case "transclusionReference":
-        return processNode(block);
-      default: {
-        // Any still-unhandled block type: NEVER fall back to markdown inside a
-        // raw-HTML block (it would become literal text). Wrap its rendered
-        // children in a <div> so their content is preserved.
-        //
-        // Only a child that is NOT an inline node counts as a block child.
-        // Testing for "not text" alone misclassified textblocks that contain a
-        // hard break or an inline atom: every child (text included) was then
-        // routed through blockToHtml, where a childless node renders as an
-        // empty <div></div>, silently dropping the text and the atom.
-        const hasBlockChild = children.some(
-          (c: any) => !inlineNodeTypes.has(c.type),
-        );
-        if (hasBlockChild) {
-          return `<div>${children.map(blockToHtml).join("")}</div>`;
-        }
-        return `<div>${inlineToHtml(children)}</div>`;
-      }
-    }
-  };
-
-  // Render the block children of a list item to HTML (a listItem holds block+
-  // content). Mirrors processListItem but for the HTML fallback path.
-  const blockChildrenToHtml = (item: any): string =>
-    (item.content || []).map((b: any) => blockToHtml(b)).join("");
-
-  // Indent the rendered children of a list item under a marker prefix.
-  // Each child block is a (possibly multi-line) string. The very first physical
-  // line of the first child carries the marker (e.g. "- " or "1. "); EVERY
-  // other line — the remaining lines of the first child AND all lines of every
-  // subsequent child (nested lists, code blocks, extra paragraphs) — is indented
-  // to align under the marker. Without indenting these continuation lines, the
-  // 2nd/3rd line of a nested child collapses to column 0 and escapes the list.
-  //
-  // The continuation indent MUST equal the LIST marker width, which is not the
-  // same as the visible prefix width:
-  //   - bullet "- "          -> 2 columns
-  //   - task   "- [ ] "      -> marker is still "- " (the "[ ] " is content), 2
-  //   - ordered "1. "/"10. " -> 3/4 columns, scaling with the number's digits
-  // CommonMark anchors nested content to the marker column, so an ordered item
-  // indented to only 2 columns would be re-parsed as a sibling/loose content on
-  // re-import. Callers therefore pass the exact indent width to use.
-  const indentItemChildren = (
-    childStrings: string[],
-    prefix: string,
-    indentWidth: number,
-  ): string => {
-    const indent = " ".repeat(indentWidth);
-    const lines: string[] = [];
-    childStrings.forEach((child, childIndex) => {
-      child.split("\n").forEach((line, lineIndex) => {
-        if (childIndex === 0 && lineIndex === 0) {
-          // First physical line of the first block gets the marker.
-          lines.push(`${prefix} ${line}`);
-        } else {
-          // Indent every continuation line by the marker width; keep blank
-          // lines blank rather than emitting trailing whitespace.
-          lines.push(line.length ? `${indent}${line}` : "");
-        }
-      });
-    });
-    return lines.join("\n");
-  };
-
-  const processListItem = (item: any, prefix: string): string => {
-    const itemContent = item.content || [];
-    const childStrings = itemContent.map(processNode);
-    if (childStrings.length === 0) return prefix;
-    // The rendered marker is `${prefix} ` (prefix + one space), so its width —
-    // and thus the continuation indent — is prefix.length + 1. This is correct
-    // for both bullet ("-" -> 2) and ordered ("1." -> 3, "10." -> 4) markers,
-    // since for those the visible prefix IS the list marker.
-    return indentItemChildren(childStrings, prefix, prefix.length + 1);
-  };
-
-  const processTaskItem = (item: any): string => {
-    const checked = item.attrs?.checked || false;
-    const checkbox = checked ? "[x]" : "[ ]";
-    const prefix = `- ${checkbox}`;
-    const itemContent = item.content || [];
-    const childStrings = itemContent.map(processNode);
-    // An empty task item still needs its checkbox marker; without this guard
-    // the indent below produces "" and the "- [ ]"/"- [x]" row disappears.
-    if (childStrings.length === 0) return prefix;
-    // The list marker for a task item is just "- " (2 columns); the "[ ] "/"[x] "
-    // checkbox is item content, NOT part of the marker. So the continuation
-    // indent is a fixed 2 — do NOT derive it from the wider prefix.length.
-    return indentItemChildren(childStrings, prefix, 2);
-  };
-
-  return processNode(content).trim();
-}
diff --git a/packages/git-sync/src/lib/markdown-to-prosemirror.ts b/packages/git-sync/src/lib/markdown-to-prosemirror.ts
deleted file mode 100644
index 4466edf4..00000000
--- a/packages/git-sync/src/lib/markdown-to-prosemirror.ts
+++ /dev/null
@@ -1,365 +0,0 @@
-/**
- * Pure markdown -> ProseMirror conversion.
- *
- * The converter path is `markdownToProseMirror` (marked -> HTML ->
- * generateJSON) plus the two pre/post processors it needs (`preprocessCallouts`,
- * `bridgeTaskLists`). The gitmost server writes the resulting page bodies
- * natively through the collab gateway, so no websocket/Yjs write-path lives
- * here.
- */
-import { generateJSON } from "@tiptap/html";
-import { JSDOM } from "jsdom";
-import { marked } from "marked";
-import { docmostExtensions } from "./docmost-schema.js";
-
-// Setup DOM environment for Tiptap HTML parsing in Node.js
-const dom = new JSDOM("<!DOCTYPE html><html><body></body></html>");
-global.window = dom.window as any;
-global.document = dom.window.document;
-// @ts-ignore
-global.Element = dom.window.Element;
-
-/**
- * Hard ceiling above which we skip callout preprocessing entirely. The linear
- * scanner below has no quadratic blow-up, but we still cap input defensively so
- * a pathological multi-megabyte payload cannot tie up the event loop; in that
- * case the markdown is passed through verbatim (callouts are simply not
- * detected) rather than risking a slow scan.
- */
-const MAX_CALLOUT_PREPROCESS_BYTES = 4 * 1024 * 1024; // 4 MB
-
-/** Matches an opening callout fence: `:::type` (type captured, lower-cased). */
-const CALLOUT_OPEN_RE = /^:::\s*(\w+)\s*$/;
-/** Matches a bare closing callout fence: `:::`. */
-const CALLOUT_CLOSE_RE = /^:::\s*$/;
-/**
- * Matches an Obsidian-native callout opener: `> [!type]` (type captured). An
- * optional title after the type is allowed but ignored (the Docmost callout
- * schema has no title). The body is the following contiguous blockquote lines.
- */
-const CALLOUT_BQ_OPEN_RE = /^>\s*\[!(\w+)\]/;
-/** Matches any blockquote continuation line (`>` … ). */
-const BLOCKQUOTE_LINE_RE = /^>/;
-/** Matches the start/end of a code fence (``` or ~~~), capturing the marker. */
-const CODE_FENCE_RE = /^(\s*)(`{3,}|~{3,})/;
-
-/**
- * Pre-process Docmost-flavoured markdown: convert `:::type ... :::`
- * callout blocks (the syntax our markdown export produces) into HTML
- * divs that the callout extension parses. The inner content is rendered
- * through marked as regular markdown.
- *
- * Implemented as a single linear pass over the lines (no quadratic regex
- * rescan). It:
- *   - tracks fenced code regions (```...``` and ~~~...~~~) and never treats a
- *     `:::` line that lives inside a code fence as a callout delimiter, so a
- *     callout body that itself contains a fenced code block with a `:::` line is
- *     no longer corrupted;
- *   - matches an opening `:::type` line with the next CLOSING `:::` at the SAME
- *     nesting level, supporting NESTED callouts via a depth counter (an inner
- *     `:::type` opens a deeper level and consumes a matching `:::`);
- *   - emits the same `<div data-type="callout" data-callout-type="TYPE">` output
- *     (inner rendered through marked) as the previous regex implementation.
- */
-async function preprocessCallouts(markdown: string): Promise<string> {
-  // Defensive cap: skip preprocessing for pathologically large inputs.
-  if (markdown.length > MAX_CALLOUT_PREPROCESS_BYTES) {
-    return markdown;
-  }
-
-  // Recursively transform a slice of lines, converting top-level callouts in
-  // that slice into <div> blocks and rendering their inner content (which may
-  // itself contain nested callouts) through this same function.
-  const transform = async (lines: string[]): Promise<string> => {
-    const out: string[] = [];
-    let inCodeFence = false;
-    let codeFenceMarker = ""; // the exact run of backticks/tildes that opened it
-    let i = 0;
-
-    while (i < lines.length) {
-      const line = lines[i];
-
-      // Inside a code fence, only its matching closing fence is significant;
-      // everything else (including `:::` lines) is copied through verbatim.
-      if (inCodeFence) {
-        out.push(line);
-        const fence = line.match(CODE_FENCE_RE);
-        if (fence && fence[2].startsWith(codeFenceMarker[0]) &&
-            fence[2].length >= codeFenceMarker.length) {
-          inCodeFence = false;
-          codeFenceMarker = "";
-        }
-        i++;
-        continue;
-      }
-
-      // A code fence opening outside any callout body: enter code-fence mode.
-      const fenceOpen = line.match(CODE_FENCE_RE);
-      if (fenceOpen) {
-        inCodeFence = true;
-        codeFenceMarker = fenceOpen[2];
-        out.push(line);
-        i++;
-        continue;
-      }
-
-      // An opening callout fence: scan forward (with code-fence and nested
-      // callout awareness) for its matching closing `:::` at the same level.
-      const open = line.match(CALLOUT_OPEN_RE);
-      if (open) {
-        const type = open[1].toLowerCase();
-        const bodyLines: string[] = [];
-        let depth = 1;
-        let innerInCodeFence = false;
-        let innerCodeFenceMarker = "";
-        let j = i + 1;
-        for (; j < lines.length; j++) {
-          const bl = lines[j];
-          if (innerInCodeFence) {
-            const f = bl.match(CODE_FENCE_RE);
-            if (f && f[2].startsWith(innerCodeFenceMarker[0]) &&
-                f[2].length >= innerCodeFenceMarker.length) {
-              innerInCodeFence = false;
-              innerCodeFenceMarker = "";
-            }
-            bodyLines.push(bl);
-            continue;
-          }
-          const innerFence = bl.match(CODE_FENCE_RE);
-          if (innerFence) {
-            innerInCodeFence = true;
-            innerCodeFenceMarker = innerFence[2];
-            bodyLines.push(bl);
-            continue;
-          }
-          if (CALLOUT_OPEN_RE.test(bl)) {
-            depth++;
-            bodyLines.push(bl);
-            continue;
-          }
-          if (CALLOUT_CLOSE_RE.test(bl)) {
-            depth--;
-            if (depth === 0) break; // matching close for THIS callout
-            bodyLines.push(bl);
-            continue;
-          }
-          bodyLines.push(bl);
-        }
-
-        if (j < lines.length) {
-          // Found the matching closing fence: render the body (recursively, so
-          // nested callouts are handled) and emit the callout div.
-          const inner = await transform(bodyLines);
-          const renderedInner = await marked.parse(inner);
-          out.push(
-            `\n<div data-type="callout" data-callout-type="${type}">${renderedInner}</div>\n`,
-          );
-          i = j + 1; // skip past the closing `:::`
-          continue;
-        }
-        // No matching close (unterminated callout): treat the opener as a
-        // literal line and continue, preserving the original text.
-        out.push(line);
-        i++;
-        continue;
-      }
-
-      // An Obsidian-native callout: `> [!type]` opener; the body is the following
-      // CONTIGUOUS blockquote (`>`-prefixed) lines. Strip ONE blockquote level and
-      // recurse so nested callouts (`> > [!type]`) are handled, then emit the same
-      // callout div the `:::` path produces. A normal blockquote (no `[!type]` on
-      // its first line) does not match and stays a blockquote.
-      const bqOpen = line.match(CALLOUT_BQ_OPEN_RE);
-      if (bqOpen) {
-        const type = bqOpen[1].toLowerCase();
-        const bodyLines: string[] = [];
-        let j = i + 1;
-        for (; j < lines.length; j++) {
-          if (!BLOCKQUOTE_LINE_RE.test(lines[j])) break;
-          bodyLines.push(lines[j].replace(/^>\s?/, ""));
-        }
-        const inner = await transform(bodyLines);
-        const renderedInner = await marked.parse(inner);
-        out.push(
-          `\n<div data-type="callout" data-callout-type="${type}">${renderedInner}</div>\n`,
-        );
-        i = j;
-        continue;
-      }
-
-      out.push(line);
-      i++;
-    }
-
-    return out.join("\n");
-  };
-
-  return transform(markdown.split("\n"));
-}
-
-/**
- * Bridge marked's checkbox lists to TipTap task lists.
- *
- * marked renders GitHub task list items (`- [x] done`) as a plain
- * `<ul><li><p><input type="checkbox" checked> text</p></li></ul>` WITHOUT the
- * markup TipTap's TaskList/TaskItem extensions parse. This rewrites such lists
- * into the shape those extensions expect:
- *   TaskList parseHTML matches `ul[data-type="taskList"]`,
- *   TaskItem matches `li[data-type="taskItem"]`,
- *   the checked state is read from `data-checked === "true"`.
- *
- * A list is only converted when it has at least one `<li>` and EVERY direct
- * `<li>` contains a checkbox input. Both `<ul>` and `<ol>` are considered: a
- * numbered checklist (`1. [x] a`, which marked renders as an `<ol>` of checkbox
- * `<li>`s) would otherwise lose its task state. TipTap task lists are unordered,
- * so a matching `<ol>` is emitted as `data-type="taskList"` exactly like a
- * `<ul>`. Mixed or ordinary lists (including ordinary `<ol>` lists) are left
- * untouched so they keep rendering as bullet/numbered lists. The marked `<p>`
- * wrapper is kept inside the `<li>` because TaskItem content allows paragraphs.
- */
-function bridgeTaskLists(html: string): string {
-  // Cheap early-out: if the markup contains no checkbox input at all there is
-  // nothing to bridge, so skip the expensive JSDOM parse entirely. This is the
-  // common case (most pages have no task lists).
-  if (!/type=["']?checkbox/i.test(html)) {
-    return html;
-  }
-  // Defensive cap (consistent with preprocessCallouts): skip the bridge for
-  // pathologically large inputs rather than running a second expensive JSDOM
-  // parse on a multi-megabyte payload. The markup is passed through verbatim.
-  if (html.length > MAX_CALLOUT_PREPROCESS_BYTES) {
-    return html;
-  }
-  const dom = new JSDOM(html);
-  const document = dom.window.document;
-  // Collect the checkbox(es) that belong to THIS <li> directly: either direct
-  // child <input type="checkbox"> elements or ones inside the <li>'s direct <p>
-  // child (the shape marked emits: `<li><p><input type="checkbox"> text</p></li>`).
-  // Checkboxes nested deeper (e.g. inside a child <ul>/<ol>) are excluded so a
-  // bullet <li> that merely contains a nested task sublist is not misdetected.
-  // Raw inline HTML can put more than one checkbox in a single <li>; we gather
-  // ALL of them so none survive into the converted item.
-  const directCheckboxes = (li: Element): Element[] => {
-    const found: Element[] = [];
-    for (const child of Array.from(li.children)) {
-      if (
-        child.tagName === "INPUT" &&
-        child.getAttribute("type") === "checkbox"
-      ) {
-        found.push(child);
-        continue;
-      }
-      if (child.tagName === "P") {
-        for (const inp of Array.from(
-          child.querySelectorAll(":scope > input[type='checkbox']"),
-        )) {
-          found.push(inp);
-        }
-      }
-    }
-    return found;
-  };
-  // Both <ul> and <ol> are candidates: an <ol> whose every direct <li> carries
-  // its own checkbox is a numbered checklist that must also become a taskList.
-  const lists = Array.from(document.querySelectorAll("ul, ol"));
-  for (const list of lists) {
-    // Only consider DIRECT child <li> elements; nested lists are handled by
-    // their own iteration of the outer loop.
-    const items = Array.from(list.children).filter(
-      (child) => child.tagName === "LI",
-    );
-    if (items.length === 0) continue;
-    const itemCheckboxes = items.map((li) => directCheckboxes(li));
-    // Convert only when every direct <li> carries at least one OWN checkbox.
-    if (!itemCheckboxes.every((boxes) => boxes.length > 0)) continue;
-
-    // A numbered checklist arrives as an <ol>. We must NOT leave the tag as
-    // <ol> while tagging it data-type="taskList": generateJSON would then match
-    // BOTH the orderedList rule (tag ol) and the taskList rule (data-type),
-    // emitting a phantom empty orderedList beside the real taskList. So rename a
-    // qualifying <ol> to a <ul> — move its <li> children over and replace it —
-    // leaving only the taskList rule to match. Already-<ul> lists are unchanged.
-    let target: Element = list;
-    if (list.tagName === "OL") {
-      const ul = document.createElement("ul");
-      // Carry over existing attributes (e.g. class) so nothing is silently lost.
-      for (const attr of Array.from(list.attributes)) {
-        ul.setAttribute(attr.name, attr.value);
-      }
-      // Move every child node (including the <li>s we collected) into the <ul>.
-      while (list.firstChild) {
-        ul.appendChild(list.firstChild);
-      }
-      list.replaceWith(ul);
-      target = ul;
-    }
-
-    target.setAttribute("data-type", "taskList");
-    items.forEach((li, index) => {
-      const boxes = itemCheckboxes[index];
-      // The first checkbox determines the checked state (matches the previous
-      // single-checkbox behaviour); any extras only need removing.
-      const input = boxes[0] ?? null;
-      li.setAttribute("data-type", "taskItem");
-      const checked =
-        input != null &&
-        (input.hasAttribute("checked") || (input as any).checked);
-      li.setAttribute("data-checked", checked ? "true" : "false");
-      // Remove ALL direct checkbox inputs so none survive into the content
-      // (a raw-inline-HTML <li> may carry more than one).
-      for (const box of boxes) {
-        box.remove();
-      }
-    });
-  }
-  return document.body.innerHTML;
-}
-
-/**
- * Recursively strip content-less paragraph nodes from a generated doc.
- *
- * A block-level atom whose markdown form is INLINE (e.g. the block `image`'s
- * `![](url)`, or a bare media element) is wrapped by marked in a <p>; the schema
- * then HOISTS the block atom out of that paragraph, leaving an EMPTY paragraph
- * sibling. On the next export that empty `<p>` renders to "" and the doc "\n\n"
- * join injects a phantom blank gap, so the markdown is not byte-stable.
- *
- * Markdown blank lines are separators, never content, so generateJSON only ever
- * produces an empty paragraph as such a hoist artifact — removing them is safe
- * and general (it also subsumes the <div>-wrapper workaround the `video` case
- * uses). We remove ONLY `type === 'paragraph'` nodes whose `content` is absent
- * or an empty array; every other node (including atoms without `content`) is
- * preserved, and we recurse into the content of any node that has children.
- */
-function stripEmptyParagraphs(node: any): any {
-  if (!node || !Array.isArray(node.content)) {
-    // Atom / leaf node (no children to recurse into): keep as-is.
-    return node;
-  }
-  const mapped = node.content.map((child: any) => stripEmptyParagraphs(child));
-  const isEmptyParagraph = (child: any): boolean =>
-    !!child &&
-    child.type === "paragraph" &&
-    (!Array.isArray(child.content) || child.content.length === 0);
-  const filtered = mapped.filter((child: any) => !isEmptyParagraph(child));
-  // Schema-validity guard: several nodes require NON-empty block content
-  // (`content: "block+"` — tableCell, tableHeader, blockquote, column, callout,
-  // and the doc root). For an empty one of those, generateJSON materializes a
-  // single empty paragraph as its OBLIGATORY content — that is not a hoist
-  // artifact. If stripping would empty the container, keep ONE empty paragraph
-  // so the result stays schema-valid (an empty cell/quote must not become `[]`).
-  const cleaned =
-    filtered.length === 0 && mapped.length > 0 ? [mapped[0]] : filtered;
-  return { ...node, content: cleaned };
-}
-
-/** Convert markdown to a ProseMirror doc using the full Docmost schema. */
-export async function markdownToProseMirror(
-  markdownContent: string,
-): Promise<any> {
-  const withCallouts = await preprocessCallouts(markdownContent);
-  const html = await marked.parse(withCallouts);
-  const bridged = bridgeTaskLists(html);
-  const doc = generateJSON(bridged, docmostExtensions);
-  return stripEmptyParagraphs(doc);
-}
diff --git a/packages/git-sync/test/apply-push-actions.test.ts b/packages/git-sync/test/apply-push-actions.test.ts
index 1f0a8d9b..4e95d761 100644
--- a/packages/git-sync/test/apply-push-actions.test.ts
+++ b/packages/git-sync/test/apply-push-actions.test.ts
@@ -2,7 +2,7 @@ import { describe, expect, it, vi, beforeEach, afterEach } from 'vitest';
 import { applyPushActions, LAST_PUSHED_REF } from '../src/engine/push';
 import { bodyHash } from '../src/engine/loop-guard';
 import type { ApplyPushDeps, PushActions } from '../src/engine/push';
-import { parsePageFile, serializePageFile } from '../src/lib/page-file';
+import { parsePageFile, serializePageFile } from '@docmost/prosemirror-markdown';
 
 // The Docmost space this vault mirrors (native files carry no spaceId; the run
 // supplies it). A CREATE targets this space.
diff --git a/packages/git-sync/test/classify-rename-moves.test.ts b/packages/git-sync/test/classify-rename-moves.test.ts
index ceb00285..12fc34bd 100644
--- a/packages/git-sync/test/classify-rename-moves.test.ts
+++ b/packages/git-sync/test/classify-rename-moves.test.ts
@@ -5,7 +5,7 @@ import type {
   MetaSide,
   RenameMoveAction,
 } from '../src/engine/push';
-import type { DocmostMdMeta } from '../src/lib/index';
+import type { DocmostMdMeta } from '@docmost/prosemirror-markdown';
 
 // FS→Docmost push #3 (SPEC §5/§6/§16). `classifyRenameMoves` is the PURE half of
 // the move/rename apply: it resolves each `{pageId, oldPath, newPath}` into the
diff --git a/packages/git-sync/test/compute-push-actions.test.ts b/packages/git-sync/test/compute-push-actions.test.ts
index 28a2b59e..74a785a0 100644
--- a/packages/git-sync/test/compute-push-actions.test.ts
+++ b/packages/git-sync/test/compute-push-actions.test.ts
@@ -1,7 +1,7 @@
 import { describe, expect, it } from 'vitest';
 import { computePushActions } from '../src/engine/push';
 import type { DiffEntry, MetaSide } from '../src/engine/push';
-import type { DocmostMdMeta } from '../src/lib/index';
+import type { DocmostMdMeta } from '@docmost/prosemirror-markdown';
 
 // FS→Docmost push, FIRST increment (SPEC §6). `computePushActions` is the PURE
 // half: it classifies each `git diff --name-status` row into a Docmost action by
diff --git a/packages/git-sync/test/cycle-roundtrip.test.ts b/packages/git-sync/test/cycle-roundtrip.test.ts
index b1d7ca40..4c281b03 100644
--- a/packages/git-sync/test/cycle-roundtrip.test.ts
+++ b/packages/git-sync/test/cycle-roundtrip.test.ts
@@ -8,7 +8,7 @@ import { runCycle } from "../src/engine/cycle";
 import type { CycleFs } from "../src/engine/cycle";
 import { VaultGit } from "../src/engine/git";
 import type { Settings } from "../src/engine/settings";
-import { serializeDocmostMarkdownBody } from "../src/lib/index";
+import { serializeDocmostMarkdownBody } from "@docmost/prosemirror-markdown";
 
 const execFileAsync = promisify(execFile);
 
diff --git a/packages/git-sync/test/engine-gaps.test.ts b/packages/git-sync/test/engine-gaps.test.ts
index 3bb209eb..f582c9c7 100644
--- a/packages/git-sync/test/engine-gaps.test.ts
+++ b/packages/git-sync/test/engine-gaps.test.ts
@@ -8,7 +8,7 @@ import { firstDivergence } from './roundtrip-helpers';
 import { applyPullActions } from '../src/engine/pull';
 import type { PullActions, ApplyPullActionsDeps } from '../src/engine/pull';
 import type { DeletionDecision } from '../src/engine/reconcile';
-import { serializePageFile, parsePageFile } from '../src/lib/page-file';
+import { serializePageFile, parsePageFile } from '@docmost/prosemirror-markdown';
 
 // Engine-layer coverage gaps flagged by the PR #119 reviewers (test-strategy
 // report, Module 2 `src/engine`). Each block targets a specific under-covered
diff --git a/packages/git-sync/test/read-existing.test.ts b/packages/git-sync/test/read-existing.test.ts
index 4d2fabd1..af72d159 100644
--- a/packages/git-sync/test/read-existing.test.ts
+++ b/packages/git-sync/test/read-existing.test.ts
@@ -1,6 +1,6 @@
 import { describe, expect, it } from 'vitest';
 import { readExisting } from '../src/engine/pull';
-import { serializePageFile } from '../src/lib/page-file';
+import { serializePageFile } from '@docmost/prosemirror-markdown';
 
 // R-Pull-1 (test-strategy report §5): `readExisting` now takes injectable IO
 // (`listTracked` / `readFile`), so its parsing + skip rules are unit-testable
diff --git a/packages/git-sync/test/redteam-layout-title.test.ts b/packages/git-sync/test/redteam-layout-title.test.ts
index 3473145d..e505557c 100644
--- a/packages/git-sync/test/redteam-layout-title.test.ts
+++ b/packages/git-sync/test/redteam-layout-title.test.ts
@@ -6,7 +6,7 @@ import type {
   MetaSide,
   RenameMoveAction,
 } from '../src/engine/push.js';
-import type { DocmostMdMeta } from '../src/lib/index.js';
+import type { DocmostMdMeta } from '@docmost/prosemirror-markdown';
 
 // RED-TEAM finding #4 (two facets):
 //   (a) buildVaultLayout disambiguation is ORDER-DEPENDENT: which of two
diff --git a/packages/git-sync/test/redteam-push-cycle.test.ts b/packages/git-sync/test/redteam-push-cycle.test.ts
index c8b0bfe2..df202242 100644
--- a/packages/git-sync/test/redteam-push-cycle.test.ts
+++ b/packages/git-sync/test/redteam-push-cycle.test.ts
@@ -8,7 +8,7 @@ import {
 import type { PushDeps } from '../src/engine/push';
 import type { Settings } from '../src/engine/settings';
 import { runCycle, type RunCycleDeps } from '../src/engine/cycle';
-import { serializePageFile } from '../src/lib/page-file';
+import { serializePageFile } from '@docmost/prosemirror-markdown';
 
 // Red-team confirmations for PR #119 (git-sync). Each test asserts the DESIRED
 // behavior, so it FAILS today iff the bug is real.
diff --git a/packages/git-sync/test/roundtrip-corpus.test.ts b/packages/git-sync/test/roundtrip-corpus.test.ts
deleted file mode 100644
index b715b170..00000000
--- a/packages/git-sync/test/roundtrip-corpus.test.ts
+++ /dev/null
@@ -1,104 +0,0 @@
-import { readFile } from 'node:fs/promises';
-import { readdirSync } from 'node:fs';
-import { fileURLToPath } from 'node:url';
-import { dirname, join } from 'node:path';
-import { describe, expect, it } from 'vitest';
-import {
-  convertProseMirrorToMarkdown,
-  markdownToProseMirror,
-  docsCanonicallyEqual,
-} from 'docmost-client';
-
-// Resolve fixtures relative to this test file so the test is CWD-independent.
-const here = dirname(fileURLToPath(import.meta.url));
-const CORPUS_DIR = join(here, 'fixtures', 'corpus');
-const KNOWN_LIMITATIONS_DIR = join(here, 'fixtures', 'known-limitations');
-
-/** Run a single document through export -> import -> export. */
-async function roundTrip(doc: any) {
-  const md1 = convertProseMirrorToMarkdown(doc);
-  const doc2 = await markdownToProseMirror(md1);
-  const md2 = convertProseMirrorToMarkdown(doc2);
-  return { md1, md2, doc2 };
-}
-
-describe('round-trip corpus (SPEC §11)', () => {
-  // Discover the corpus synchronously at collection time so each fixture gets
-  // its own `it` with the file name in the test title.
-  const files = readdirSync(CORPUS_DIR)
-    .filter((name) => name.endsWith('.json'))
-    .sort();
-
-  it('has a non-empty corpus', () => {
-    expect(files.length).toBeGreaterThan(0);
-  });
-
-  for (const name of files) {
-    it(`${name}: markdown byte-stable AND canonically stable`, async () => {
-      const doc = JSON.parse(await readFile(join(CORPUS_DIR, name), 'utf8'));
-      const { md1, md2, doc2 } = await roundTrip(doc);
-
-      // 1) The byte-stable markdown property git actually needs.
-      expect(md2, `${name}: markdown not byte-stable`).toBe(md1);
-      // 2) Semantic stability (block ids stripped, default-null normalized).
-      expect(
-        docsCanonicallyEqual(doc, doc2),
-        `${name}: document not canonically stable`,
-      ).toBe(true);
-    });
-  }
-});
-
-// ---------------------------------------------------------------------------
-// KNOWN CONVERTER LIMITATIONS (isolated so they do NOT make CI red).
-//
-// SPEC §11 explicitly flags images and diagrams as high round-trip risk. These
-// fixtures are kept OUT of the green corpus above and asserted with `it.fails`
-// so the documented divergence is locked in (the test FAILS if the converter
-// ever starts round-tripping them — at which point promote the fixture into
-// the corpus). The precise divergences for `image-diagrams.json` are:
-//
-//   * A BLOCK-LEVEL image preceded by a paragraph is NOT byte-stable on the
-//     FIRST re-export. The HTML re-parser hoists the block <img> out of its
-//     line and leaves an empty paragraph behind, so `paragraph` + `![..](..)`
-//     re-imports as paragraph + empty-paragraph + image; the empty paragraph
-//     adds one blank line, so export #2 grows by a one-time "\n\n" (md1 !== md2).
-//     This is NOT non-convergence: the growth happens exactly ONCE. The doc
-//     CONVERGES to a fixpoint after one extra `export→import→export` pass — the
-//     empty paragraph is already present after the first import, so export #2
-//     and export #3 are byte-identical (md2 === md3, verified).
-//
-//   * drawio / excalidraw diagrams gain `data-align="center"` on the second
-//     export: the schema's diagram `align` attribute has a NON-null default of
-//     "center", which materializes on import; the converter only emits
-//     data-align when set, so it appears on export #2 but not #1. Like the
-//     image case, this is one-time and converges after one extra pass.
-//
-//   * A STANDALONE block image (no preceding paragraph) IS byte-stable from
-//     export #1 (md1 === md2) — but it is still NOT canonically stable: on
-//     import the bare <img> is wrapped, gaining a leading EMPTY paragraph, so
-//     the canonical doc differs by that spurious paragraph node even though the
-//     markdown bytes match.
-//
-// Resolution (SPEC §11, "normalize-on-write"): rather than deep-fixing the
-// converter, the engine runs ONE `export→import→export` pass when writing into
-// the vault; from that fixpoint onward the form is byte-stable, so git sees no
-// phantom diff. The green corpus above avoids these one-time asymmetries by
-// pre-authoring the materialized defaults (e.g. `align: "center"` on the
-// diagrams in 06-diagrams.json) so a single pass is already at the fixpoint.
-// ---------------------------------------------------------------------------
-describe('round-trip KNOWN LIMITATIONS (SPEC §11 image/diagram risk)', () => {
-  it.fails(
-    'image-diagrams.json is NOT byte-stable on export #1 (block image hoist + diagram align default; converges after one extra pass — SPEC §11 normalize-on-write)',
-    async () => {
-      const doc = JSON.parse(
-        await readFile(join(KNOWN_LIMITATIONS_DIR, 'image-diagrams.json'), 'utf8'),
-      );
-      const { md1, md2 } = await roundTrip(doc);
-      // This assertion FAILS today (documented divergence). `it.fails` turns a
-      // failing body into a PASS; if the converter is fixed this flips and the
-      // test goes red, prompting promotion into the green corpus.
-      expect(md2).toBe(md1);
-    },
-  );
-});
diff --git a/packages/git-sync/test/run-push-realgit.test.ts b/packages/git-sync/test/run-push-realgit.test.ts
index 0dc36aed..3d94ba3a 100644
--- a/packages/git-sync/test/run-push-realgit.test.ts
+++ b/packages/git-sync/test/run-push-realgit.test.ts
@@ -8,7 +8,7 @@ import { runPush, LAST_PUSHED_REF } from '../src/engine/push';
 import type { PushDeps } from '../src/engine/push';
 import { VaultGit } from '../src/engine/git';
 import type { Settings } from '../src/engine/settings';
-import { serializeDocmostMarkdownBody } from '../src/lib/index';
+import { serializeDocmostMarkdownBody } from '@docmost/prosemirror-markdown';
 
 const execFileAsync = promisify(execFile);
 
diff --git a/packages/git-sync/test/run-push.test.ts b/packages/git-sync/test/run-push.test.ts
index c5c4f060..adaf4f2b 100644
--- a/packages/git-sync/test/run-push.test.ts
+++ b/packages/git-sync/test/run-push.test.ts
@@ -2,7 +2,7 @@ import { describe, expect, it, vi } from 'vitest';
 import { runPush, LAST_PUSHED_REF, DOCMOST_BRANCH } from '../src/engine/push';
 import type { PushDeps } from '../src/engine/push';
 import type { Settings } from '../src/engine/settings';
-import { serializePageFile } from '../src/lib/page-file';
+import { serializePageFile } from '@docmost/prosemirror-markdown';
 
 /** A native page file: `gitmost_id` frontmatter + clean body (title = filename). */
 function fileFor(pageId: string, body = 'body'): string {
diff --git a/packages/git-sync/test/stabilize.test.ts b/packages/git-sync/test/stabilize.test.ts
index ebc63d35..d5303e9f 100644
--- a/packages/git-sync/test/stabilize.test.ts
+++ b/packages/git-sync/test/stabilize.test.ts
@@ -2,8 +2,8 @@ import { describe, expect, it } from 'vitest';
 import { stabilizePageFile, type PageMeta } from '../src/engine/stabilize.js';
 // markdownToProseMirror lives in collaboration.ts; importing it mutates the
 // global DOM via jsdom at module load time (required for @tiptap/html under Node).
-import { markdownToProseMirror } from '../src/lib/markdown-to-prosemirror.js';
-import { parseDocmostMarkdown } from '../src/lib/markdown-document.js';
+import { markdownToProseMirror } from '@docmost/prosemirror-markdown';
+import { parseDocmostMarkdown } from '@docmost/prosemirror-markdown';
 
 // stabilize.ts (SPEC §11 normalize-on-write) was 0% covered (only the gated e2e
 // touched it). stabilizePageFile is import-testable: build a small ProseMirror
@@ -22,16 +22,27 @@ const meta: PageMeta = {
 
 describe('stabilizePageFile — normalize-on-write fixpoint (SPEC §11)', () => {
   it('reaches a byte-identical fixpoint after one extra export/import/export pass', async () => {
-    // A diagram is the canonical one-pass asymmetry: drawio's `align` default of
-    // "center" materializes on import, so a NAIVE export differs on the second
-    // export. stabilizePageFile runs the convergence pass at write time, so the
-    // written body must already be at the fixpoint: re-importing its body and
+    // A diagram inside a column is the canonical one-pass asymmetry: on the
+    // raw-HTML/columns path a diagram's `align` default of "center" materializes
+    // on import, so a NAIVE export differs on the second export. (#293 canon #8
+    // made the TOP-LEVEL diagram form — `![](src)<!--drawio …-->` — byte-stable by
+    // omitting the default, so the asymmetry now lives only on the columns path
+    // where the schema `<div data-type="drawio">` form is retained.)
+    // stabilizePageFile runs the convergence pass at write time, so the written
+    // body must already be at the fixpoint: re-importing its body and
     // re-stabilizing yields the exact same bytes.
     const content = {
       type: 'doc',
       content: [
         { type: 'paragraph', content: [{ type: 'text', text: 'intro' }] },
-        { type: 'drawio', attrs: { src: '/d.drawio' } },
+        {
+          type: 'columns',
+          attrs: { layout: 'two_equal' },
+          content: [
+            { type: 'column', content: [{ type: 'drawio', attrs: { src: '/d.drawio' } }] },
+            { type: 'column', content: [{ type: 'paragraph', content: [{ type: 'text', text: 'side' }] }] },
+          ],
+        },
         { type: 'paragraph', content: [{ type: 'text', text: 'outro' }] },
       ],
     };
diff --git a/packages/git-sync/test/strip-empty-paragraphs-validity.test.ts b/packages/git-sync/test/strip-empty-paragraphs-validity.test.ts
index e5514ec2..d1f48b87 100644
--- a/packages/git-sync/test/strip-empty-paragraphs-validity.test.ts
+++ b/packages/git-sync/test/strip-empty-paragraphs-validity.test.ts
@@ -1,8 +1,8 @@
 import { describe, it, expect } from "vitest";
 import { getSchema } from "@tiptap/core";
 
-import { markdownToProseMirror } from "../src/lib/markdown-to-prosemirror";
-import { docmostExtensions } from "../src/lib/docmost-schema";
+import { markdownToProseMirror } from "@docmost/prosemirror-markdown";
+import { docmostExtensions } from "@docmost/prosemirror-markdown";
 
 // REGRESSION LOCK for the stripEmptyParagraphs schema-validity guard.
 //
diff --git a/packages/mcp/build/_vendored_editor_ext/copy.js b/packages/mcp/build/_vendored_editor_ext/copy.js
deleted file mode 100644
index 428db9cf..00000000
--- a/packages/mcp/build/_vendored_editor_ext/copy.js
+++ /dev/null
@@ -1,6 +0,0 @@
-"use strict";
-Object.defineProperty(exports, "__esModule", { value: true });
-exports.copy = copy;
-function copy(value) {
-    return JSON.parse(JSON.stringify(value));
-}
diff --git a/packages/mcp/build/_vendored_editor_ext/getFromPath.js b/packages/mcp/build/_vendored_editor_ext/getFromPath.js
deleted file mode 100644
index b5b56b0c..00000000
--- a/packages/mcp/build/_vendored_editor_ext/getFromPath.js
+++ /dev/null
@@ -1,18 +0,0 @@
-"use strict";
-Object.defineProperty(exports, "__esModule", { value: true });
-exports.getFromPath = getFromPath;
-/**
- * get target value from json-pointer (e.g. /content/0/content)
- * @param  {AnyObject} obj  object to resolve path into
- * @param  {string}    path json-pointer
- * @return {any} target value
- */
-function getFromPath(obj, path) {
-    const pathParts = path.split("/");
-    pathParts.shift(); // remove root-entry
-    while (pathParts.length) {
-        const property = pathParts.shift();
-        obj = obj[property];
-    }
-    return obj;
-}
diff --git a/packages/mcp/build/_vendored_editor_ext/getReplaceStep.js b/packages/mcp/build/_vendored_editor_ext/getReplaceStep.js
deleted file mode 100644
index 357ce0d7..00000000
--- a/packages/mcp/build/_vendored_editor_ext/getReplaceStep.js
+++ /dev/null
@@ -1,27 +0,0 @@
-"use strict";
-Object.defineProperty(exports, "__esModule", { value: true });
-exports.getReplaceStep = getReplaceStep;
-const transform_1 = require("@tiptap/pm/transform");
-function getReplaceStep(fromDoc, toDoc) {
-    let start = toDoc.content.findDiffStart(fromDoc.content);
-    if (start === null) {
-        return false;
-    }
-    // @ts-ignore property access to content
-    let { a: endA, b: endB } = toDoc.content.findDiffEnd(fromDoc.content);
-    const overlap = start - Math.min(endA, endB);
-    if (overlap > 0) {
-        // If there is an overlap, there is some freedom of choice in how to calculate the
-        // start/end boundary. for an inserted/removed slice. We choose the extreme with
-        // the lowest depth value.
-        if (fromDoc.resolve(start - overlap).depth <
-            toDoc.resolve(endA + overlap).depth) {
-            start -= overlap;
-        }
-        else {
-            endA += overlap;
-            endB += overlap;
-        }
-    }
-    return new transform_1.ReplaceStep(start, endB, toDoc.slice(start, endA));
-}
diff --git a/packages/mcp/build/_vendored_editor_ext/index.js b/packages/mcp/build/_vendored_editor_ext/index.js
deleted file mode 100644
index 37b373e2..00000000
--- a/packages/mcp/build/_vendored_editor_ext/index.js
+++ /dev/null
@@ -1,8 +0,0 @@
-"use strict";
-Object.defineProperty(exports, "__esModule", { value: true });
-exports.RecreateTransform = exports.recreateTransform = void 0;
-// https://gitlab.com/mpapp-public/prosemirror-recreate-steps - MIT
-// https://github.com/sueddeutsche/prosemirror-recreate-transform - MIT
-var recreateTransform_1 = require("./recreateTransform");
-Object.defineProperty(exports, "recreateTransform", { enumerable: true, get: function () { return recreateTransform_1.recreateTransform; } });
-Object.defineProperty(exports, "RecreateTransform", { enumerable: true, get: function () { return recreateTransform_1.RecreateTransform; } });
diff --git a/packages/mcp/build/_vendored_editor_ext/package.json b/packages/mcp/build/_vendored_editor_ext/package.json
deleted file mode 100644
index 0292b995..00000000
--- a/packages/mcp/build/_vendored_editor_ext/package.json
+++ /dev/null
@@ -1 +0,0 @@
-{"type":"commonjs"}
\ No newline at end of file
diff --git a/packages/mcp/build/_vendored_editor_ext/recreateTransform.js b/packages/mcp/build/_vendored_editor_ext/recreateTransform.js
deleted file mode 100644
index 0b2226bf..00000000
--- a/packages/mcp/build/_vendored_editor_ext/recreateTransform.js
+++ /dev/null
@@ -1,242 +0,0 @@
-"use strict";
-Object.defineProperty(exports, "__esModule", { value: true });
-exports.RecreateTransform = void 0;
-exports.recreateTransform = recreateTransform;
-const transform_1 = require("@tiptap/pm/transform");
-const rfc6902_1 = require("rfc6902");
-const diff_1 = require("diff");
-const getReplaceStep_1 = require("./getReplaceStep");
-const simplifyTransform_1 = require("./simplifyTransform");
-const removeMarks_1 = require("./removeMarks");
-const getFromPath_1 = require("./getFromPath");
-const copy_1 = require("./copy");
-class RecreateTransform {
-    constructor(fromDoc, toDoc, options = {}) {
-        const o = {
-            complexSteps: true,
-            wordDiffs: false,
-            simplifyDiff: true,
-            ...options,
-        };
-        this.fromDoc = fromDoc;
-        this.toDoc = toDoc;
-        this.complexSteps = o.complexSteps; // Whether to return steps other than ReplaceSteps
-        this.wordDiffs = o.wordDiffs; // Whether to make text diffs cover entire words
-        this.simplifyDiff = o.simplifyDiff;
-        this.schema = fromDoc.type.schema;
-        this.tr = new transform_1.Transform(fromDoc);
-    }
-    init() {
-        if (this.complexSteps) {
-            // For First steps: we create versions of the documents without marks as
-            // these will only confuse the diffing mechanism and marks won't cause
-            // any mapping changes anyway.
-            this.currentJSON = (0, removeMarks_1.removeMarks)(this.fromDoc).toJSON();
-            this.finalJSON = (0, removeMarks_1.removeMarks)(this.toDoc).toJSON();
-            this.ops = (0, rfc6902_1.createPatch)(this.currentJSON, this.finalJSON);
-            this.recreateChangeContentSteps();
-            this.recreateChangeMarkSteps();
-        }
-        else {
-            // We don't differentiate between mark changes and other changes.
-            this.currentJSON = this.fromDoc.toJSON();
-            this.finalJSON = this.toDoc.toJSON();
-            this.ops = (0, rfc6902_1.createPatch)(this.currentJSON, this.finalJSON);
-            this.recreateChangeContentSteps();
-        }
-        if (this.simplifyDiff) {
-            this.tr = (0, simplifyTransform_1.simplifyTransform)(this.tr) || this.tr;
-        }
-        return this.tr;
-    }
-    /** convert json-diff to prosemirror steps */
-    recreateChangeContentSteps() {
-        // First step: find content changing steps.
-        let ops = [];
-        while (this.ops.length) {
-            // get next
-            let op = this.ops.shift();
-            ops.push(op);
-            let toDoc;
-            const afterStepJSON = (0, copy_1.copy)(this.currentJSON); // working document receiving patches
-            const pathParts = op.path.split("/");
-            // collect operations until we receive a valid document:
-            // apply ops-patches until a valid prosemirror document is retrieved,
-            // then try to create a transformation step or retry with next operation
-            while (toDoc == null) {
-                (0, rfc6902_1.applyPatch)(afterStepJSON, [op]);
-                try {
-                    toDoc = this.schema.nodeFromJSON(afterStepJSON);
-                    toDoc.check();
-                }
-                catch (error) {
-                    toDoc = null;
-                    if (this.ops.length > 0) {
-                        op = this.ops.shift();
-                        ops.push(op);
-                    }
-                    else {
-                        throw new Error(`No valid diff possible applying ${op.path}`);
-                    }
-                }
-            }
-            // apply operation (ignoring afterStepJSON)
-            if (this.complexSteps &&
-                ops.length === 1 &&
-                (pathParts.includes("attrs") || pathParts.includes("type"))) {
-                // Node markup is changing
-                this.addSetNodeMarkup(); // a lost update is ignored
-                ops = [];
-                // console.log("%cop", logStyle, "- update node", ops);
-            }
-            else if (ops.length === 1 &&
-                op.op === "replace" &&
-                pathParts[pathParts.length - 1] === "text") {
-                // Text is being replaced, we apply text diffing to find the smallest possible diffs.
-                this.addReplaceTextSteps(op, afterStepJSON);
-                ops = [];
-                // console.log("%cop", logStyle, "- replace", ops);
-            }
-            else if (this.addReplaceStep(toDoc, afterStepJSON)) {
-                // operations have been applied
-                ops = [];
-                // console.log("%cop", logStyle, "- other", ops);
-            }
-        }
-    }
-    /** update node with attrs and marks, may also change type */
-    addSetNodeMarkup() {
-        // first diff in document is supposed to be a node-change (in type and/or attributes)
-        // thus simply find the first change and apply a node change step, then recalculate the diff
-        // after updating the document
-        const fromDoc = this.schema.nodeFromJSON(this.currentJSON);
-        const toDoc = this.schema.nodeFromJSON(this.finalJSON);
-        const start = toDoc.content.findDiffStart(fromDoc.content);
-        // @note start is the same (first) position for current and target document
-        const fromNode = fromDoc.nodeAt(start);
-        const toNode = toDoc.nodeAt(start);
-        if (start != null) {
-            // @note this completly updates all attributes in one step, by completely replacing node
-            const nodeType = fromNode.type === toNode.type ? null : toNode.type;
-            try {
-                this.tr.setNodeMarkup(start, nodeType, toNode.attrs, toNode.marks);
-            }
-            catch (e) {
-                // if nodetypes differ, the updated node-type and contents might not be compatible
-                // with schema and requires a replace
-                if (nodeType && e.message.includes("Invalid content")) {
-                    // @todo add test-case for this scenario
-                    this.tr.replaceWith(start, start + fromNode.nodeSize, toNode);
-                }
-                else {
-                    throw e;
-                }
-            }
-            this.currentJSON = (0, removeMarks_1.removeMarks)(this.tr.doc).toJSON();
-            // setting the node markup may have invalidated the following ops, so we calculate them again.
-            this.ops = (0, rfc6902_1.createPatch)(this.currentJSON, this.finalJSON);
-            return true;
-        }
-        return false;
-    }
-    recreateChangeMarkSteps() {
-        // Now the documents should be the same, except their marks, so everything should map 1:1.
-        // Second step: Iterate through the toDoc and make sure all marks are the same in tr.doc
-        this.toDoc.descendants((tNode, tPos) => {
-            if (!tNode.isInline) {
-                return true;
-            }
-            this.tr.doc.nodesBetween(tPos, tPos + tNode.nodeSize, (fNode, fPos) => {
-                if (!fNode.isInline) {
-                    return true;
-                }
-                const from = Math.max(tPos, fPos);
-                const to = Math.min(tPos + tNode.nodeSize, fPos + fNode.nodeSize);
-                fNode.marks.forEach((nodeMark) => {
-                    if (!nodeMark.isInSet(tNode.marks)) {
-                        this.tr.removeMark(from, to, nodeMark);
-                    }
-                });
-                tNode.marks.forEach((nodeMark) => {
-                    if (!nodeMark.isInSet(fNode.marks)) {
-                        this.tr.addMark(from, to, nodeMark);
-                    }
-                });
-            });
-        });
-    }
-    /**
-     * retrieve and possibly apply replace-step based from doc changes
-     * From http://prosemirror.net/examples/footnote/
-     */
-    addReplaceStep(toDoc, afterStepJSON) {
-        const fromDoc = this.schema.nodeFromJSON(this.currentJSON);
-        const step = (0, getReplaceStep_1.getReplaceStep)(fromDoc, toDoc);
-        if (!step) {
-            return false;
-        }
-        else if (!this.tr.maybeStep(step).failed) {
-            this.currentJSON = afterStepJSON;
-            return true; // @change previously null
-        }
-        throw new Error("No valid step found.");
-    }
-    /** retrieve and possibly apply text replace-steps based from doc changes */
-    addReplaceTextSteps(op, afterStepJSON) {
-        // We find the position number of the first character in the string
-        const op1 = { ...op, value: "xx" };
-        const op2 = { ...op, value: "yy" };
-        const afterOP1JSON = (0, copy_1.copy)(this.currentJSON);
-        const afterOP2JSON = (0, copy_1.copy)(this.currentJSON);
-        (0, rfc6902_1.applyPatch)(afterOP1JSON, [op1]);
-        (0, rfc6902_1.applyPatch)(afterOP2JSON, [op2]);
-        const op1Doc = this.schema.nodeFromJSON(afterOP1JSON);
-        const op2Doc = this.schema.nodeFromJSON(afterOP2JSON);
-        // get text diffs
-        const finalText = op.value;
-        const currentText = (0, getFromPath_1.getFromPath)(this.currentJSON, op.path);
-        const textDiffs = this.wordDiffs
-            ? (0, diff_1.diffWordsWithSpace)(currentText, finalText)
-            : (0, diff_1.diffChars)(currentText, finalText);
-        let offset = op1Doc.content.findDiffStart(op2Doc.content);
-        const marks = op1Doc.resolve(offset + 1).marks();
-        while (textDiffs.length) {
-            const diff = textDiffs.shift();
-            if (diff.added) {
-                const textNode = this.schema
-                    .nodeFromJSON({ type: "text", text: diff.value })
-                    .mark(marks);
-                if (textDiffs.length && textDiffs[0].removed) {
-                    const nextDiff = textDiffs.shift();
-                    this.tr.replaceWith(offset, offset + nextDiff.value.length, textNode);
-                }
-                else {
-                    this.tr.insert(offset, textNode);
-                }
-                offset += diff.value.length;
-            }
-            else if (diff.removed) {
-                if (textDiffs.length && textDiffs[0].added) {
-                    const nextDiff = textDiffs.shift();
-                    const textNode = this.schema
-                        .nodeFromJSON({ type: "text", text: nextDiff.value })
-                        .mark(marks);
-                    this.tr.replaceWith(offset, offset + diff.value.length, textNode);
-                    offset += nextDiff.value.length;
-                }
-                else {
-                    this.tr.delete(offset, offset + diff.value.length);
-                }
-            }
-            else {
-                offset += diff.value.length;
-            }
-        }
-        this.currentJSON = afterStepJSON;
-    }
-}
-exports.RecreateTransform = RecreateTransform;
-function recreateTransform(fromDoc, toDoc, options = {}) {
-    const recreator = new RecreateTransform(fromDoc, toDoc, options);
-    return recreator.init();
-}
diff --git a/packages/mcp/build/_vendored_editor_ext/recreateTransform.test.js b/packages/mcp/build/_vendored_editor_ext/recreateTransform.test.js
deleted file mode 100644
index 79323148..00000000
--- a/packages/mcp/build/_vendored_editor_ext/recreateTransform.test.js
+++ /dev/null
@@ -1,118 +0,0 @@
-"use strict";
-Object.defineProperty(exports, "__esModule", { value: true });
-const vitest_1 = require("vitest");
-const schema_basic_1 = require("@tiptap/pm/schema-basic");
-const transform_1 = require("@tiptap/pm/transform");
-const recreateTransform_1 = require("./recreateTransform");
-/**
- * recreateTransform diffs two documents and produces ProseMirror steps that turn
- * `fromDoc` into `toDoc`. It is the backbone of collaborative/version diffing, so
- * THE invariant that matters is: replaying the produced steps on `fromDoc` must
- * reproduce `toDoc` exactly. Every test below re-applies the steps onto a fresh
- * Transform seeded from `fromDoc` (not just trusting `tr.doc`) and asserts node
- * equality with `.eq()`. If a regression makes any step wrong, the round-trip
- * breaks and the test fails.
- */
-// Real ProseMirror schema (the standard basic schema) with paragraph/heading +
-// strong/em marks — the same primitives the editor diffs in production.
-const doc = (...c) => schema_basic_1.schema.node("doc", null, c);
-const p = (...c) => schema_basic_1.schema.node("paragraph", null, c.length ? c : undefined);
-const h = (level, ...c) => schema_basic_1.schema.node("heading", { level }, c);
-const t = (text, ...marks) => schema_basic_1.schema.text(text, marks.length ? marks : undefined);
-const strong = schema_basic_1.schema.marks.strong.create();
-const em = schema_basic_1.schema.marks.em.create();
-// Replay the diff's steps onto a fresh Transform built from `fromDoc`. This is
-// the faithful "apply(diff) == target" check — it exercises the actual Step
-// objects rather than the transform's internal accumulated doc.
-function applyDiff(fromDoc, toDoc, options) {
-    const tr = (0, recreateTransform_1.recreateTransform)(fromDoc, toDoc, options);
-    const replay = new transform_1.Transform(fromDoc);
-    tr.steps.forEach((s) => {
-        const result = replay.maybeStep(s);
-        if (result.failed)
-            throw new Error(`step failed: ${result.failed}`);
-    });
-    return replay.doc;
-}
-(0, vitest_1.describe)("recreateTransform round-trip (apply(diff) == target)", () => {
-    (0, vitest_1.it)("reconstructs the target on plain text insertion", () => {
-        // Inserting " world" must yield exactly the target paragraph.
-        const from = doc(p(t("hello")));
-        const to = doc(p(t("hello world")));
-        (0, vitest_1.expect)(applyDiff(from, to).eq(to)).toBe(true);
-    });
-    (0, vitest_1.it)("reconstructs the target on text deletion", () => {
-        // Deleting a trailing word is the inverse of insertion and must round-trip.
-        const from = doc(p(t("hello world")));
-        const to = doc(p(t("hello")));
-        (0, vitest_1.expect)(applyDiff(from, to).eq(to)).toBe(true);
-    });
-    (0, vitest_1.it)("reconstructs the target when a word is replaced mid-string", () => {
-        // A char-level replace in the middle must not corrupt the surrounding text.
-        const from = doc(p(t("the quick brown fox")));
-        const to = doc(p(t("the slow brown fox")));
-        (0, vitest_1.expect)(applyDiff(from, to).eq(to)).toBe(true);
-    });
-    (0, vitest_1.it)("reconstructs the target when a mark is added (complexSteps path)", () => {
-        // Mark-only changes are diffed in a separate pass; the bolded run must match.
-        const from = doc(p(t("hello")));
-        const to = doc(p(t("hello", strong)));
-        const out = applyDiff(from, to);
-        (0, vitest_1.expect)(out.eq(to)).toBe(true);
-        // Sanity: the produced doc actually carries the strong mark.
-        (0, vitest_1.expect)(out.firstChild.firstChild.marks.length).toBe(1);
-    });
-    (0, vitest_1.it)("reconstructs the target when a mark is removed", () => {
-        // Removing the only mark must leave the same text with no marks.
-        const from = doc(p(t("hello", strong)));
-        const to = doc(p(t("hello")));
-        const out = applyDiff(from, to);
-        (0, vitest_1.expect)(out.eq(to)).toBe(true);
-        (0, vitest_1.expect)(out.firstChild.firstChild.marks.length).toBe(0);
-    });
-    (0, vitest_1.it)("reconstructs the target on a paragraph split into two blocks", () => {
-        // Structural change (one block -> two) must replay as valid replace steps.
-        const from = doc(p(t("hello world")));
-        const to = doc(p(t("hello")), p(t("world")));
-        const out = applyDiff(from, to);
-        (0, vitest_1.expect)(out.eq(to)).toBe(true);
-        (0, vitest_1.expect)(out.childCount).toBe(2);
-    });
-    (0, vitest_1.it)("reconstructs the target on a node-type change (paragraph -> heading)", () => {
-        // Type/attrs changes drive the setNodeMarkup branch; the node must become a
-        // heading while keeping its text.
-        const from = doc(p(t("hello")));
-        const to = doc(h(1, t("hello")));
-        const out = applyDiff(from, to);
-        (0, vitest_1.expect)(out.eq(to)).toBe(true);
-        (0, vitest_1.expect)(out.firstChild.type.name).toBe("heading");
-    });
-    (0, vitest_1.it)("reconstructs a combined structural + mark change", () => {
-        // Several diff kinds at once (new block + italic run) still round-trips.
-        const from = doc(p(t("alpha")));
-        const to = doc(p(t("alpha")), p(t("beta", em)));
-        const out = applyDiff(from, to);
-        (0, vitest_1.expect)(out.eq(to)).toBe(true);
-    });
-    (0, vitest_1.it)("produces an empty step list for identical documents", () => {
-        // No diff => no work; spurious steps would mean wasted/incorrect history.
-        const from = doc(p(t("same")));
-        const to = doc(p(t("same")));
-        const tr = (0, recreateTransform_1.recreateTransform)(from, to);
-        (0, vitest_1.expect)(tr.steps.length).toBe(0);
-        (0, vitest_1.expect)(tr.doc.eq(to)).toBe(true);
-    });
-    (0, vitest_1.it)("round-trips with complexSteps:false (marks diffed as replaces)", () => {
-        // With complexSteps off, mark changes are folded into replace steps rather
-        // than dedicated mark steps — the result must still equal the target.
-        const from = doc(p(t("hello")));
-        const to = doc(p(t("hello", strong)));
-        (0, vitest_1.expect)(applyDiff(from, to, { complexSteps: false }).eq(to)).toBe(true);
-    });
-    (0, vitest_1.it)("round-trips with wordDiffs:true (whole-word text diffing)", () => {
-        // wordDiffs changes the granularity of the text diff, not the outcome.
-        const from = doc(p(t("the quick brown fox")));
-        const to = doc(p(t("the quick red fox")));
-        (0, vitest_1.expect)(applyDiff(from, to, { wordDiffs: true }).eq(to)).toBe(true);
-    });
-});
diff --git a/packages/mcp/build/_vendored_editor_ext/removeMarks.js b/packages/mcp/build/_vendored_editor_ext/removeMarks.js
deleted file mode 100644
index a0bedebc..00000000
--- a/packages/mcp/build/_vendored_editor_ext/removeMarks.js
+++ /dev/null
@@ -1,9 +0,0 @@
-"use strict";
-Object.defineProperty(exports, "__esModule", { value: true });
-exports.removeMarks = removeMarks;
-const transform_1 = require("@tiptap/pm/transform");
-function removeMarks(doc) {
-    const tr = new transform_1.Transform(doc);
-    tr.removeMark(0, doc.nodeSize - 2);
-    return tr.doc;
-}
diff --git a/packages/mcp/build/_vendored_editor_ext/simplifyTransform.js b/packages/mcp/build/_vendored_editor_ext/simplifyTransform.js
deleted file mode 100644
index 57fd9995..00000000
--- a/packages/mcp/build/_vendored_editor_ext/simplifyTransform.js
+++ /dev/null
@@ -1,27 +0,0 @@
-"use strict";
-Object.defineProperty(exports, "__esModule", { value: true });
-exports.simplifyTransform = simplifyTransform;
-const transform_1 = require("@tiptap/pm/transform");
-const getReplaceStep_1 = require("./getReplaceStep");
-// join adjacent ReplaceSteps
-function simplifyTransform(tr) {
-    if (!tr.steps.length) {
-        return undefined;
-    }
-    const newTr = new transform_1.Transform(tr.docs[0]);
-    const oldSteps = tr.steps.slice();
-    while (oldSteps.length) {
-        let step = oldSteps.shift();
-        while (oldSteps.length && step.merge(oldSteps[0])) {
-            const addedStep = oldSteps.shift();
-            if (step instanceof transform_1.ReplaceStep && addedStep instanceof transform_1.ReplaceStep) {
-                step = (0, getReplaceStep_1.getReplaceStep)(newTr.doc, addedStep.apply(step.apply(newTr.doc).doc).doc);
-            }
-            else {
-                step = step.merge(addedStep);
-            }
-        }
-        newTr.step(step);
-    }
-    return newTr;
-}
diff --git a/packages/mcp/build/_vendored_editor_ext/types.js b/packages/mcp/build/_vendored_editor_ext/types.js
deleted file mode 100644
index c8ad2e54..00000000
--- a/packages/mcp/build/_vendored_editor_ext/types.js
+++ /dev/null
@@ -1,2 +0,0 @@
-"use strict";
-Object.defineProperty(exports, "__esModule", { value: true });
diff --git a/packages/mcp/build/client.js b/packages/mcp/build/client.js
deleted file mode 100644
index 81a2ec29..00000000
--- a/packages/mcp/build/client.js
+++ /dev/null
@@ -1,2988 +0,0 @@
-import FormData from "form-data";
-import axios from "axios";
-import { basename, extname } from "path";
-import { filterWorkspace, filterSpace, filterPage, filterComment, filterSearchResult, } from "./lib/filters.js";
-import { HocuspocusProvider } from "@hocuspocus/provider";
-import { TiptapTransformer } from "@hocuspocus/transformer";
-import * as Y from "yjs";
-import WebSocket from "ws";
-import { convertProseMirrorToMarkdown } from "./lib/markdown-converter.js";
-import { collectInternalFileNodes, normalizeFileUrl, resolveInternalFilePath, } from "./lib/internal-file-urls.js";
-import { updatePageContentRealtime, replacePageContent, markdownToProseMirror, markdownToProseMirrorCanonical, mutatePageContent, buildCollabWsUrl, assertYjsEncodable, applyDocToFragment, } from "./lib/collaboration.js";
-import { footnoteWarningsField } from "./lib/footnote-analyze.js";
-import { buildPageTree } from "./lib/tree.js";
-import { serializeDocmostMarkdown, parseDocmostMarkdown, } from "./lib/markdown-document.js";
-import { replaceNodeById, deleteNodeById, assertUnambiguousMatch, insertNodeRelative, buildOutline, getNodeByRef, readTable, insertTableRow, deleteTableRow, updateTableCell, } from "./lib/node-ops.js";
-import { searchInDoc } from "./lib/page-search.js";
-import { withPageLock } from "./lib/page-lock.js";
-import { applyTextEdits, } from "./lib/json-edit.js";
-import { getCollabToken, performLogin } from "./lib/auth-utils.js";
-import { diffDocs, summarizeChange } from "./lib/diff.js";
-import { applyAnchorInDoc, canAnchorInDoc, countAnchorMatches, getAnchoredText, } from "./lib/comment-anchor.js";
-import { blockText, walk, getList, insertMarkerAfter, setCalloutRange, noteItem, mdToInlineNodes, commentsToFootnotes, canonicalizeFootnotes, insertInlineFootnote, } from "./lib/transforms.js";
-import vm from "node:vm";
-// Supported image types, kept as two lookup tables so both a local file
-// extension and a remote Content-Type can be mapped to the same canonical set.
-const EXT_TO_MIME = {
-    ".png": "image/png",
-    ".jpg": "image/jpeg",
-    ".jpeg": "image/jpeg",
-    ".gif": "image/gif",
-    ".webp": "image/webp",
-    ".svg": "image/svg+xml",
-};
-const MIME_TO_EXT = {
-    "image/png": ".png",
-    "image/jpeg": ".jpg",
-    "image/gif": ".gif",
-    "image/webp": ".webp",
-    "image/svg+xml": ".svg",
-};
-// Canonical UUID shape (versions 1–8, matching the `uuid` package's `validate`
-// that the server's isValidUUID uses). page.repo.ts treats any non-UUID pageId
-// as a slugId, so the MCP detects a UUID locally and skips a /pages/info
-// round-trip in resolvePageId. A 10-char nanoid slugId never contains dashes,
-// so it can never be misread as a UUID here.
-const UUID_RE = /^[0-9a-f]{8}-[0-9a-f]{4}-[1-8][0-9a-f]{3}-[89ab][0-9a-f]{3}-[0-9a-f]{12}$/i;
-function isUuid(value) {
-    return typeof value === "string" && UUID_RE.test(value);
-}
-export class DocmostClient {
-    client;
-    token = null;
-    apiUrl;
-    // email/password are only set on the service-account (credentials) variant;
-    // null on the getToken variant (where there are no credentials to log in with).
-    email = null;
-    password = null;
-    // Per-user token provider. When set, login() calls it to obtain a BARE access
-    // JWT instead of performLogin, and the 401/403 re-auth path re-calls it.
-    getTokenFn = null;
-    // Optional collab-token provider. When set, getCollabTokenWithReauth() returns
-    // its token instead of calling POST /auth/collab-token; on a 401/403 it is
-    // re-invoked once. Used by the internal agent to carry signed provenance.
-    getCollabTokenFn = null;
-    // Optional blob-sandbox sink for the stash tool. Null when not configured.
-    sandboxPut = null;
-    // Optional probes paired with the sink. `has` lets stashPage detect a blob
-    // FIFO-evicted by a LATER put in the same stash; `evict` lets it free this
-    // op's image blobs if the final doc put throws. Null when the sink omits them.
-    sandboxHas = null;
-    sandboxEvict = null;
-    // In-flight login dedup: when the token expires, the 401 interceptor,
-    // ensureAuthenticated, getCollabTokenWithReauth and the two multipart retries
-    // can all call login() at once. Memoizing a single promise collapses that
-    // thundering herd into ONE /auth/login request that everyone awaits.
-    loginPromise = null;
-    // Canonical-UUID cache for resolvePageId: maps an agent-supplied slugId to the
-    // page's canonical UUID, so repeated collab edits on the same page do not
-    // re-fetch /pages/info. A UUID input short-circuits before this cache (see
-    // resolvePageId), so only slugId->uuid entries are stored/read here.
-    pageIdCache = new Map();
-    constructor(configOrBaseURL, email, password) {
-        // Normalize the legacy positional form into the object union.
-        const config = typeof configOrBaseURL === "string"
-            ? { apiUrl: configOrBaseURL, email: email, password: password }
-            : configOrBaseURL;
-        this.apiUrl = config.apiUrl;
-        if ("getToken" in config) {
-            // Token variant: carry the user's JWT via getToken; no credentials, so
-            // login() must never call performLogin (there is nothing to log in with).
-            this.getTokenFn = config.getToken;
-        }
-        else {
-            // Service-account variant: behaves exactly as before (performLogin).
-            this.email = config.email;
-            this.password = config.password;
-        }
-        // Optional, available to both variants. When present, content mutations get
-        // their collab token from here instead of POST /auth/collab-token.
-        if (config.getCollabToken) {
-            this.getCollabTokenFn = config.getCollabToken;
-        }
-        if (config.sandbox) {
-            this.sandboxPut = config.sandbox.put;
-            this.sandboxHas = config.sandbox.has ?? null;
-            this.sandboxEvict = config.sandbox.evict ?? null;
-        }
-        this.client = axios.create({
-            baseURL: this.apiUrl,
-            // Default request timeout so a hung connection cannot wedge a per-page
-            // lock or block the server indefinitely. Multipart uploads override this
-            // with a longer per-request timeout.
-            timeout: 30000,
-            headers: {
-                "Content-Type": "application/json",
-            },
-        });
-        // Re-authenticate transparently on a 401/403 once: the JWT authToken can
-        // expire while the server is long-running, after which every cached-token
-        // request would otherwise fail until a manual restart. On such a response,
-        // clear the stale token, perform a fresh login, and replay the original
-        // request exactly once (guarded by config._retry to avoid infinite loops;
-        // the login request itself is never retried).
-        this.client.interceptors.response.use((response) => response, async (error) => {
-            const config = error.config;
-            const status = error.response?.status;
-            const isAuthError = status === 401 || status === 403;
-            const isLoginRequest = typeof config?.url === "string" && config.url.includes("/auth/login");
-            if (config && isAuthError && !config._retry && !isLoginRequest) {
-                config._retry = true;
-                // Drop the stale token + Authorization header before re-login.
-                this.token = null;
-                delete this.client.defaults.headers.common["Authorization"];
-                try {
-                    await this.login();
-                }
-                catch (loginError) {
-                    // Re-login failed: surface the original error to the caller.
-                    return Promise.reject(error);
-                }
-                // Re-issue the original request with the freshly minted Bearer token.
-                // Read it from the default header that login() just set, not from
-                // this.token, to avoid a theoretical "Bearer null" if this.token was
-                // cleared between login() resolving and this point.
-                config.headers = config.headers || {};
-                config.headers["Authorization"] =
-                    this.client.defaults.headers.common["Authorization"];
-                return this.client.request(config);
-            }
-            return Promise.reject(error);
-        });
-    }
-    /** Application base URL (API URL without the /api suffix). */
-    get appUrl() {
-        return this.apiUrl.replace(/\/api\/?$/, "");
-    }
-    async login() {
-        // Reuse an in-flight login if one is already running so concurrent callers
-        // share a single token fetch instead of each issuing their own.
-        if (!this.loginPromise) {
-            // Token variant: re-fetch a BARE JWT via getToken() (there are no
-            // credentials to log in with — on a 401/403 the interceptor below calls
-            // login() again, which re-invokes getToken()). Credentials variant:
-            // performLogin against /auth/login exactly as before.
-            const fetchToken = this.getTokenFn
-                ? this.getTokenFn()
-                : performLogin(this.apiUrl, this.email, this.password);
-            this.loginPromise = fetchToken
-                .then((token) => {
-                // Guard against an empty/invalid token (e.g. a getToken provider that
-                // resolves to "" or null): without this an empty token would set a
-                // literal "Authorization: Bearer null"/"Bearer " header and every
-                // request would 401 with a confusing error. Fail loudly instead.
-                if (typeof token !== "string" || token.length === 0) {
-                    throw new Error("getToken returned an empty token");
-                }
-                this.token = token;
-                this.client.defaults.headers.common["Authorization"] =
-                    `Bearer ${token}`;
-            })
-                .finally(() => {
-                this.loginPromise = null;
-            });
-        }
-        return this.loginPromise;
-    }
-    async ensureAuthenticated() {
-        if (!this.token) {
-            await this.login();
-        }
-    }
-    /**
-     * Fetch a collaboration token, transparently re-authenticating once on a
-     * 401/403. getCollabToken() uses bare axios internally, so it is NOT covered
-     * by this.client's response interceptor; this helper replicates that
-     * behaviour for collab-token requests: ensure a token, try once, and on an
-     * expired-token auth error perform a fresh login and retry exactly once.
-     */
-    async getCollabTokenWithReauth() {
-        // Collab-token PROVIDER path: when a getCollabToken provider was supplied
-        // (the internal agent's provenance collab token), use it instead of the
-        // REST /auth/collab-token endpoint. Re-invoke it once on a 401/403 (e.g. the
-        // signed token expired between content mutations in a long agent turn).
-        if (this.getCollabTokenFn) {
-            try {
-                const token = await this.getCollabTokenFn();
-                if (typeof token !== "string" || token.length === 0) {
-                    throw new Error("getCollabToken returned an empty token");
-                }
-                return token;
-            }
-            catch (e) {
-                const axiosStatus = axios.isAxiosError(e)
-                    ? e.response?.status
-                    : undefined;
-                const attachedStatus = e?.status;
-                const isAuthError = axiosStatus === 401 ||
-                    axiosStatus === 403 ||
-                    attachedStatus === 401 ||
-                    attachedStatus === 403;
-                if (isAuthError) {
-                    const token = await this.getCollabTokenFn();
-                    if (typeof token !== "string" || token.length === 0) {
-                        throw new Error("getCollabToken returned an empty token");
-                    }
-                    return token;
-                }
-                throw e;
-            }
-        }
-        await this.ensureAuthenticated();
-        try {
-            return await getCollabToken(this.apiUrl, this.token);
-        }
-        catch (e) {
-            // getCollabToken wraps the AxiosError in a plain Error but attaches the
-            // HTTP status as `.status`, so detect an auth failure via either the raw
-            // AxiosError shape OR the attached status.
-            const axiosStatus = axios.isAxiosError(e)
-                ? e.response?.status
-                : undefined;
-            const attachedStatus = e?.status;
-            const isAuthError = axiosStatus === 401 ||
-                axiosStatus === 403 ||
-                attachedStatus === 401 ||
-                attachedStatus === 403;
-            if (isAuthError) {
-                await this.login();
-                return await getCollabToken(this.apiUrl, this.token);
-            }
-            throw e;
-        }
-    }
-    /**
-     * Connect to the collaboration websocket, read the live doc, apply
-     * `transform`, write the result, and wait for the server to persist it —
-     * WITHOUT acquiring the per-page lock.
-     *
-     * This mirrors collaboration.mutatePageContent EXCEPT that it does not call
-     * withPageLock. It exists solely so replaceImage can hold ONE withPageLock
-     * across its scan -> upload -> write sequence: the per-page mutex is NOT
-     * reentrant, so calling the normal (self-locking) mutatePageContent inside an
-     * outer withPageLock for the same pageId would deadlock. The caller MUST hold
-     * the page lock for the whole operation; this helper assumes that invariant.
-     *
-     * `transform` receives the live ProseMirror doc and returns the NEW full doc
-     * to write, or `null` to abort with no write. Errors thrown by `transform`
-     * propagate to the caller.
-     *
-     * Resolves a `MutationResult { doc, verify }` mirroring mutatePageContent, so
-     * every content mutator (including replaceImage) can return a verifiable
-     * change report. The report is computed AFTER the atomic read->write and
-     * never throws.
-     */
-    mutateLiveContentUnlocked(pageId, collabToken, transform) {
-        const CONNECT_TIMEOUT_MS = 25000;
-        const PERSIST_TIMEOUT_MS = 20000;
-        const ydoc = new Y.Doc();
-        const wsUrl = buildCollabWsUrl(this.apiUrl);
-        return new Promise((resolve, reject) => {
-            let provider;
-            let applied = false; // onSynced may fire again on reconnect — apply once.
-            let settled = false;
-            let connectionLost = false;
-            let connectTimer;
-            let persistTimer;
-            let unsyncedHandler;
-            // The verifiable result resolved on every success/abort path. Set on abort
-            // (no-op report) and after a real write (computed change report).
-            let mutationResult;
-            const cleanup = () => {
-                if (connectTimer)
-                    clearTimeout(connectTimer);
-                if (persistTimer)
-                    clearTimeout(persistTimer);
-                if (provider) {
-                    if (unsyncedHandler) {
-                        try {
-                            provider.off("unsyncedChanges", unsyncedHandler);
-                        }
-                        catch (err) { }
-                    }
-                    try {
-                        provider.destroy();
-                    }
-                    catch (err) { }
-                }
-            };
-            const finish = (err, value) => {
-                if (settled)
-                    return;
-                settled = true;
-                cleanup();
-                if (err)
-                    reject(err);
-                else
-                    resolve(value);
-            };
-            connectTimer = setTimeout(() => {
-                finish(new Error("Connection timeout to collaboration server"));
-            }, CONNECT_TIMEOUT_MS);
-            const waitForPersistence = () => {
-                if (settled)
-                    return;
-                if (!provider) {
-                    finish(new Error("collab provider gone before persistence"));
-                    return;
-                }
-                if (provider.unsyncedChanges === 0) {
-                    finish(null, mutationResult);
-                    return;
-                }
-                persistTimer = setTimeout(() => {
-                    finish(new Error("Timeout waiting for collaboration server to persist the update"));
-                }, PERSIST_TIMEOUT_MS);
-                unsyncedHandler = (data) => {
-                    if (data.number === 0 && !connectionLost) {
-                        finish(null, mutationResult);
-                    }
-                };
-                provider.on("unsyncedChanges", unsyncedHandler);
-            };
-            provider = new HocuspocusProvider({
-                url: wsUrl,
-                name: `page.${pageId}`,
-                document: ydoc,
-                token: collabToken,
-                // @ts-ignore - Required for Node.js environment
-                WebSocketPolyfill: WebSocket,
-                onDisconnect: () => {
-                    connectionLost = true;
-                    finish(new Error("Collaboration connection closed before the update was persisted/synced"));
-                },
-                onClose: () => {
-                    connectionLost = true;
-                    finish(new Error("Collaboration connection closed before the update was persisted/synced"));
-                },
-                onSynced: () => {
-                    if (applied || settled)
-                        return;
-                    applied = true;
-                    // CRITICAL: keep everything between reading and writing the live doc
-                    // synchronous (no await) so no remote update can interleave.
-                    let newDoc;
-                    let beforeDoc;
-                    try {
-                        let liveDoc = TiptapTransformer.fromYdoc(ydoc, "default");
-                        if (!liveDoc ||
-                            typeof liveDoc !== "object" ||
-                            !Array.isArray(liveDoc.content)) {
-                            liveDoc = { type: "doc", content: [] };
-                        }
-                        // Snapshot the before-doc for the change report (safe deep clone).
-                        beforeDoc = JSON.parse(JSON.stringify(liveDoc));
-                        newDoc = transform(liveDoc);
-                        if (newDoc == null) {
-                            // Transform aborted — write nothing, return the live doc with a
-                            // no-op change report.
-                            mutationResult = {
-                                doc: liveDoc,
-                                verify: {
-                                    changed: false,
-                                    textInserted: 0,
-                                    textDeleted: 0,
-                                    blocksChanged: 0,
-                                    marks: {},
-                                    summary: "no changes (transform aborted)",
-                                },
-                            };
-                            finish(null, mutationResult);
-                            return;
-                        }
-                        // Structural diff into the live fragment (issue #152), mirroring
-                        // the main write path: preserves the Yjs ids of unchanged nodes so
-                        // an open editor's cursor is not yanked to the end of the document.
-                        // The previous destructive rewrite (delete-all + applyUpdate of a
-                        // fresh Y.Doc) discarded every node id, so replaceImage — the only
-                        // caller of this method — still reproduced the #152 cursor jump
-                        // (#164). applyDocToFragment runs its own atomic `transact`.
-                        applyDocToFragment(ydoc, newDoc);
-                    }
-                    catch (e) {
-                        finish(e instanceof Error ? e : new Error(String(e)));
-                        return;
-                    }
-                    // Compute the verifiable change report AFTER the transact write: it
-                    // only needs the JSON before/after, so it cannot affect the atomic
-                    // read->write window, and summarizeChange never throws.
-                    mutationResult = {
-                        doc: newDoc,
-                        verify: summarizeChange(beforeDoc, newDoc),
-                    };
-                    waitForPersistence();
-                },
-                onAuthenticationFailed: () => {
-                    finish(new Error("Authentication failed for collaboration connection"));
-                },
-            });
-        });
-    }
-    /**
-     * Generic pagination handler for Docmost API endpoints
-     */
-    async paginateAll(endpoint, basePayload = {}, limit = 100) {
-        await this.ensureAuthenticated();
-        const clampedLimit = Math.max(1, Math.min(100, limit));
-        // Hard ceiling on the number of pages to fetch: guards against a server
-        // that returns a perpetually-true hasNextPage (which would otherwise loop
-        // forever and accumulate duplicates).
-        const MAX_PAGES = 50;
-        let page = 1;
-        let allItems = [];
-        let hasNextPage = true;
-        while (hasNextPage && page <= MAX_PAGES) {
-            const response = await this.client.post(endpoint, {
-                ...basePayload,
-                limit: clampedLimit,
-                page,
-            });
-            const data = response.data;
-            const items = data.data?.items || data.items || [];
-            const meta = data.data?.meta || data.meta;
-            allItems = allItems.concat(items);
-            // Stop if the page is empty or shorter than the requested size: a full
-            // page worth of items is the only situation where another page can exist,
-            // so this defends against a stuck hasNextPage flag in addition to it.
-            if (items.length === 0 || items.length < clampedLimit) {
-                break;
-            }
-            hasNextPage = meta?.hasNextPage || false;
-            page++;
-        }
-        // If the loop stopped because it hit the MAX_PAGES ceiling while the server
-        // still reported more results (hasNextPage true and the last page was
-        // full), the result set is truncated — warn so the caller is not silently
-        // handed an incomplete list.
-        if (hasNextPage && page > MAX_PAGES) {
-            console.warn(`paginateAll: results from "${endpoint}" truncated at the ${MAX_PAGES}-page cap; more pages exist on the server`);
-        }
-        return allItems;
-    }
-    async getWorkspace() {
-        await this.ensureAuthenticated();
-        const response = await this.client.post("/workspace/info", {});
-        return {
-            data: filterWorkspace(response.data?.data ?? response.data),
-            success: response.data.success,
-        };
-    }
-    async getSpaces() {
-        const spaces = await this.paginateAll("/spaces", {});
-        return spaces.map((space) => filterSpace(space));
-    }
-    /**
-     * List pages in one of two modes.
-     *
-     * Default (`tree` false): most recent pages by updatedAt (descending),
-     * bounded. Fetching the whole space can exceed MCP response/time limits on
-     * large instances, so a single bounded page of results is returned (default
-     * 50, max 100) via the `/pages/recent` feed.
-     *
-     * Tree (`tree` true): the space's FULL page hierarchy as a nested tree (each
-     * node has a `children` array). This mode REQUIRES `spaceId` (a page tree is
-     * scoped to one space) and IGNORES `limit` — the whole hierarchy is returned.
-     * It walks the sidebar tree via `enumerateSpacePages`, which performs N
-     * sidebar requests and is bounded by that method's 10000-node cap (and skips
-     * soft-deleted pages server-side).
-     */
-    async listPages(spaceId, limit = 50, tree = false) {
-        await this.ensureAuthenticated();
-        if (tree) {
-            if (!spaceId) {
-                throw new Error("list_pages: tree mode requires a spaceId (a page tree is scoped to one space). Pass spaceId, or omit tree to get the recent-pages list.");
-            }
-            const nodes = await this.enumerateSpacePages(spaceId);
-            return buildPageTree(nodes);
-        }
-        const clampedLimit = Math.max(1, Math.min(100, limit));
-        const payload = { limit: clampedLimit, page: 1 };
-        if (spaceId)
-            payload.spaceId = spaceId;
-        const response = await this.client.post("/pages/recent", payload);
-        const data = response.data;
-        const items = data.data?.items || data.items || [];
-        return items.map((page) => filterPage(page));
-    }
-    /**
-     * List sidebar pages for a space. With no pageId the request returns the
-     * space ROOT pages; with a pageId it returns the direct CHILDREN of that
-     * page. pageId is therefore optional and is only included in the POST body
-     * when provided (an empty/undefined pageId would otherwise change the
-     * semantics on the server).
-     */
-    async listSidebarPages(spaceId, pageId) {
-        await this.ensureAuthenticated();
-        // Paginate: the endpoint returns server-paged children, so posting only
-        // { page: 1 } silently dropped every child beyond the first page. Loop on
-        // meta.hasNextPage (with a MAX_PAGES ceiling like paginateAll, guarding
-        // against a stuck hasNextPage flag) and accumulate all children.
-        const MAX_PAGES = 50;
-        let page = 1;
-        let allItems = [];
-        let hasNextPage = true;
-        while (hasNextPage && page <= MAX_PAGES) {
-            // Only send pageId when scoping to a page's children; omit it for roots.
-            const payload = { spaceId, page };
-            if (pageId)
-                payload.pageId = pageId;
-            const response = await this.client.post("/pages/sidebar-pages", payload);
-            const data = response.data?.data ?? response.data;
-            const items = data?.items || [];
-            allItems = allItems.concat(items);
-            hasNextPage = data?.meta?.hasNextPage || false;
-            page++;
-        }
-        return allItems;
-    }
-    /**
-     * Enumerate EVERY page in a space (or in a subtree, when rootPageId is given)
-     * by walking the sidebar-pages tree.
-     *
-     * Starting set: the children of rootPageId when provided, otherwise the
-     * space root pages. From there it does an iterative breadth-first walk: each
-     * node is collected, and when node.hasChildren is true its direct children
-     * are fetched via listSidebarPages(spaceId, node.id) and enqueued.
-     *
-     * This replaces the old "/pages/recent" enumeration, which is a bounded
-     * recent-activity feed (~5000 cap) and therefore misses comments on older
-     * pages that were never recently touched.
-     *
-     * Safeguards: a `visited` Set of page ids prevents re-processing a node
-     * (cycles / duplicate references), and a hard node cap bounds pathological
-     * trees so the walk always terminates.
-     */
-    async enumerateSpacePages(spaceId, rootPageId) {
-        const MAX_NODES = 10000;
-        const result = [];
-        const visited = new Set();
-        // Seed the queue with the starting level (subtree children or roots).
-        const queue = await this.listSidebarPages(spaceId, rootPageId);
-        while (queue.length > 0 && result.length < MAX_NODES) {
-            const node = queue.shift();
-            if (!node || typeof node !== "object" || !node.id)
-                continue;
-            // Skip already-seen ids to guard against cycles / duplicate references.
-            if (visited.has(node.id))
-                continue;
-            visited.add(node.id);
-            result.push(node);
-            if (node.hasChildren) {
-                try {
-                    const children = await this.listSidebarPages(spaceId, node.id);
-                    for (const child of children)
-                        queue.push(child);
-                }
-                catch (e) {
-                    // A failure fetching one node's children must not abort the whole
-                    // walk: skip this branch and keep enumerating the rest.
-                }
-            }
-        }
-        return result;
-    }
-    /** Raw page info including the ProseMirror JSON content and slugId. */
-    async getPageRaw(pageId) {
-        await this.ensureAuthenticated();
-        const response = await this.client.post("/pages/info", { pageId });
-        return response.data?.data ?? response.data;
-    }
-    /**
-     * Resolve an agent-supplied pageId to the page's CANONICAL UUID (`page.id`),
-     * so every collaboration document the MCP opens is named `page.<uuid>` — the
-     * SAME name the web editor always uses (`page.${page.id}`).
-     *
-     * The agent commonly passes a 10-char public slugId (from URLs/listings) as
-     * the pageId. The web editor opens the collab doc by UUID, but the MCP used to
-     * pass that slugId straight into the collab doc name (`page.<slugId>`). For one
-     * DB row that produced TWO independent Yjs documents whose debounced stores
-     * clobbered each other — the agent's edit was silently lost (#260).
-     *
-     * A UUID input short-circuits with no network round-trip. A slugId is resolved
-     * once via getPageRaw and cached (both slugId->uuid and uuid->uuid), so
-     * repeated edits on the same page add no extra request.
-     */
-    async resolvePageId(pageId) {
-        if (isUuid(pageId))
-            return pageId;
-        const cached = this.pageIdCache.get(pageId);
-        if (cached)
-            return cached;
-        const data = await this.getPageRaw(pageId);
-        const uuid = data?.id;
-        if (typeof uuid !== "string" || !uuid) {
-            throw new Error(`Could not resolve a canonical page id for "${pageId}"`);
-        }
-        this.pageIdCache.set(pageId, uuid);
-        return uuid;
-    }
-    async getPage(pageId) {
-        await this.ensureAuthenticated();
-        const resultData = await this.getPageRaw(pageId);
-        let content = resultData.content
-            ? convertProseMirrorToMarkdown(resultData.content)
-            : "";
-        // Always fetch subpages to provide context to the agent
-        let subpages = [];
-        try {
-            // `pageId` may be a slugId, but the sidebar-pages endpoint requires the
-            // UUID; `resultData.id` holds the resolved UUID returned by getPageRaw.
-            subpages = await this.listSidebarPages(resultData.spaceId, resultData.id);
-        }
-        catch (e) {
-            console.warn("Failed to fetch subpages:", e);
-        }
-        // Resolve subpages if the placeholder exists
-        if (content && content.includes("{{SUBPAGES}}")) {
-            if (subpages && subpages.length > 0) {
-                const list = subpages
-                    .map((p) => `- [${p.title}](page:${p.id})`)
-                    .join("\n");
-                content = content.replace("{{SUBPAGES}}", `### Subpages\n${list}`);
-            }
-            else {
-                content = content.replace("{{SUBPAGES}}", "");
-            }
-        }
-        return {
-            data: filterPage(resultData, content, subpages),
-            success: true,
-        };
-    }
-    /** Page info + raw ProseMirror JSON content (lossless representation). */
-    async getPageJson(pageId) {
-        const data = await this.getPageRaw(pageId);
-        return {
-            id: data.id,
-            slugId: data.slugId,
-            title: data.title,
-            parentPageId: data.parentPageId,
-            spaceId: data.spaceId,
-            updatedAt: data.updatedAt,
-            content: data.content || { type: "doc", content: [] },
-        };
-    }
-    /**
-     * Fetch an INTERNAL Docmost file (authed loopback) for sandbox mirroring.
-     * `src` is normalized to `/api/files/<id>/<file>`; `this.client.baseURL`
-     * already ends in `/api`, so we strip the leading `/api` and request the
-     * relative path with the client's Authorization header. Returns the raw bytes
-     * and the response Content-Type (mime), defaulting to octet-stream.
-     *
-     * The fetch is size-bounded (hard 64 MiB ceiling) purely to protect memory;
-     * the authoritative per-blob cap is enforced by the sandbox `put`. The path is
-     * resolved via resolveInternalFilePath, which REJECTS (throws) any traversal
-     * or percent-encoded src that would let an attacker-controlled `attrs.src`
-     * escape `/api/files/` and reach another internal endpoint (SSRF). That throw
-     * happens before this.client.get, so a malicious src is counted as a failed
-     * mirror — it never reaches the network.
-     */
-    async fetchInternalFile(src) {
-        const HARD_CEILING = 64 * 1024 * 1024; // 64 MiB memory guard
-        const relPath = resolveInternalFilePath(src);
-        const response = await this.client.get(relPath, {
-            responseType: "arraybuffer",
-            timeout: 30000,
-            maxContentLength: HARD_CEILING,
-            maxBodyLength: HARD_CEILING,
-        });
-        const buffer = Buffer.from(response.data);
-        if (buffer.length === 0) {
-            throw new Error(`Empty file response from "${src}"`);
-        }
-        const rawCt = response.headers?.["content-type"];
-        const mime = typeof rawCt === "string" && rawCt.length > 0
-            ? rawCt.split(";")[0].trim().toLowerCase()
-            : "application/octet-stream";
-        return { buffer, mime };
-    }
-    /**
-     * Stash a page's full content into the in-RAM blob sandbox and return ONLY a
-     * short anonymous URL — the body never enters the model context (this is the
-     * whole point: ~30KB+ ProseMirror docs blow the model context if passed as a
-     * tool argument). Every INTERNAL file/image src (the type-agnostic criterion,
-     * so drawio/excalidraw/video/file nodes are covered too) is mirrored into the
-     * sandbox and its `src` rewritten to the sandbox URL, so an external consumer
-     * can fetch the images anonymously. External http(s) srcs are left untouched.
-     *
-     * Blobs live in RAM with a short TTL and are cleared on restart — consume the
-     * URLs within the TTL and one uptime. A failed image fetch never aborts the
-     * doc: the original src is kept and the failure counted.
-     *
-     * Returns { uri, sha256, size, images:{mirrored, failed} }. `uri` and `sha256`
-     * are for the document blob; `sha256` is also the blob's ETag (integrity).
-     */
-    async stashPage(pageId) {
-        if (!this.sandboxPut) {
-            throw new Error("stash_page is unavailable: the blob sandbox is not configured on this server");
-        }
-        await this.ensureAuthenticated();
-        // Stash the SAME shape get_page_json returns (id/title/.../content), with a
-        // deep clone so the rewrite never mutates anything shared.
-        const pageJson = await this.getPageJson(pageId);
-        const cloned = structuredClone(pageJson);
-        // Group internal-file nodes by normalized src so each unique resource is
-        // fetched + stored ONCE (dedup), and every node sharing that src points at
-        // the one sandbox blob. Capture each node's ORIGINAL raw src per-node:
-        // dedup groups nodes whose normalized src is equal even when their raw srcs
-        // differ (e.g. `/api/files/...` vs the bare `/files/...`), so on a revert we
-        // must restore each node's own original value, not the group key.
-        const bySrc = new Map();
-        for (const node of collectInternalFileNodes(cloned.content)) {
-            const origSrc = String(node.attrs.src);
-            const src = normalizeFileUrl(origSrc);
-            const entry = { node, origSrc };
-            const group = bySrc.get(src);
-            if (group)
-                group.push(entry);
-            else
-                bySrc.set(src, [entry]);
-        }
-        let mirrored = 0;
-        let failed = 0;
-        // Record every successful mirror so it can be (a) reverted if its blob gets
-        // FIFO-evicted by a LATER put in this same stash, and (b) freed if the final
-        // doc put throws.
-        const mirrors = [];
-        const MAX_CONCURRENCY = 5;
-        const groups = [...bySrc.entries()];
-        for (let i = 0; i < groups.length; i += MAX_CONCURRENCY) {
-            const batch = groups.slice(i, i + MAX_CONCURRENCY);
-            await Promise.all(batch.map(async ([src, entries]) => {
-                try {
-                    const { buffer, mime } = await this.fetchInternalFile(src);
-                    // put may throw if the blob exceeds the per-blob/total caps.
-                    const stored = this.sandboxPut(buffer, mime);
-                    for (const entry of entries)
-                        entry.node.attrs.src = stored.uri;
-                    mirrors.push({ uri: stored.uri, entries });
-                    mirrored++;
-                }
-                catch (err) {
-                    // One bad/oversized image (or a rejected traversal src) must not
-                    // abort the document. Logged unconditionally (never the blob body),
-                    // matching the package's ungated console.warn convention.
-                    failed++;
-                    console.warn(`stash_page: failed to mirror "${src}": ${err instanceof Error ? err.message : String(err)}`);
-                }
-            }));
-        }
-        // Revert one mirror's nodes to their original internal srcs and re-count it
-        // as failed (its blob was FIFO-evicted before the doc could reference it
-        // safely).
-        const revertMirror = (mirror) => {
-            for (const entry of mirror.entries)
-                entry.node.attrs.src = entry.origSrc;
-            mirrored--;
-            failed++;
-            console.warn(`stash_page: mirrored blob ${mirror.uri} was evicted before the doc ` +
-                `could safely reference it; reverted its src and counted it as failed`);
-        };
-        // Pre-put reconciliation: an image put earlier in THIS stash can FIFO-evict
-        // an even-earlier image of the same stash. Drop those from the live set
-        // first so the first serialized doc is already mostly correct.
-        let liveMirrors = mirrors;
-        if (this.sandboxHas) {
-            liveMirrors = [];
-            for (const mirror of mirrors) {
-                if (this.sandboxHas(mirror.uri))
-                    liveMirrors.push(mirror);
-                else
-                    revertMirror(mirror);
-            }
-        }
-        // Put the document, then reconcile against eviction caused by the doc put
-        // ITSELF (the doc is newest, FIFO drops oldest = this stash's images). Each
-        // iteration reverts >=1 mirror, so the loop terminates (worst case: all
-        // images reverted and the doc references no sandbox image URLs).
-        let stored;
-        for (;;) {
-            const docBuf = Buffer.from(JSON.stringify(cloned), "utf8");
-            let docStored;
-            try {
-                docStored = this.sandboxPut(docBuf, "application/json");
-            }
-            catch (err) {
-                // The doc put failed (e.g. doc exceeds the cap). Free this op's image
-                // blobs instead of leaking them in RAM for the whole TTL, then
-                // re-throw.
-                if (this.sandboxEvict) {
-                    for (const mirror of liveMirrors)
-                        this.sandboxEvict(mirror.uri);
-                }
-                throw err;
-            }
-            if (!this.sandboxHas) {
-                stored = docStored;
-                break;
-            }
-            const evictedNow = liveMirrors.filter((m) => !this.sandboxHas(m.uri));
-            if (evictedNow.length === 0) {
-                stored = docStored;
-                break;
-            }
-            // The doc we just stored references now-dead blobs. Revert those nodes,
-            // drop the stale doc blob, and loop to re-serialize + re-put the
-            // corrected doc.
-            for (const mirror of evictedNow)
-                revertMirror(mirror);
-            liveMirrors = liveMirrors.filter((m) => this.sandboxHas(m.uri));
-            if (this.sandboxEvict)
-                this.sandboxEvict(docStored.uri);
-        }
-        return {
-            uri: stored.uri,
-            sha256: stored.sha256,
-            size: stored.size,
-            images: { mirrored, failed },
-        };
-    }
-    /**
-     * Compact outline of a page's top-level blocks (no full document body).
-     * Cheap way to locate sections/tables and grab block ids before drilling in
-     * with get_node / patch_node / insert_node.
-     */
-    async getOutline(pageId) {
-        await this.ensureAuthenticated();
-        const data = await this.getPageRaw(pageId);
-        return {
-            pageId,
-            slugId: data.slugId,
-            title: data.title,
-            outline: buildOutline(data.content ?? { type: "doc", content: [] }),
-        };
-    }
-    /**
-     * Fetch a single node's full ProseMirror subtree (lossless) by reference:
-     * a block id (headings/paragraphs/callouts/images), or `#<index>` to select
-     * a top-level block by its outline index (the only way to reach tables/rows/
-     * cells, which carry no id).
-     */
-    async getNode(pageId, nodeId) {
-        await this.ensureAuthenticated();
-        const data = await this.getPageRaw(pageId);
-        const hit = getNodeByRef(data.content ?? { type: "doc", content: [] }, nodeId);
-        if (!hit) {
-            throw new Error(`get_node: no node found for "${nodeId}" on page ${pageId} (use a block id from get_outline, or "#<index>" for a top-level block such as a table)`);
-        }
-        return {
-            pageId,
-            ref: nodeId,
-            path: hit.path,
-            type: hit.type,
-            node: hit.node,
-        };
-    }
-    /**
-     * Find every occurrence of `query` on a page IN MEMORY, over the plain text of
-     * each text container (reusing the same `getPageRaw` fetch as the other read
-     * tools) — no server search endpoint, no whole-document round-trip through the
-     * model. Returns `{ total, truncated, matches }`; each match carries a ref for
-     * get_node/patch_node (the `#<index>` form resolves with get_node but NOT
-     * patch_node — see SearchMatch.nodeId), plus the top-level block index and a
-     * short context window used to build a unique text `selection` for
-     * create_comment (create_comment has no nodeId param). The pure engine
-     * (`searchInDoc`) owns the traversal, glue, the RE2 ReDoS-safe regex engine
-     * and the empty-query / invalid-or-unsupported-regex errors.
-     */
-    async searchInPage(pageId, query, opts = {}) {
-        await this.ensureAuthenticated();
-        const data = await this.getPageRaw(pageId);
-        const result = searchInDoc(data.content ?? { type: "doc", content: [] }, query, opts);
-        return { pageId, query, ...result };
-    }
-    /**
-     * Read a table as a matrix. `tableRef` is `#<index>` (from get_outline) or a
-     * block id of any node inside the table. Returns the cell texts plus a
-     * parallel cellIds matrix (each cell's first paragraph id, or null) so a
-     * caller can patch_node a cell for rich-formatted edits. Throws when no table
-     * resolves for the reference.
-     */
-    async getTable(pageId, tableRef) {
-        await this.ensureAuthenticated();
-        const data = await this.getPageRaw(pageId);
-        const t = readTable(data.content ?? { type: "doc", content: [] }, tableRef);
-        if (!t) {
-            throw new Error(`table_get: no table found for "${tableRef}" on page ${pageId} (use "#<index>" from get_outline, or a block id inside the table)`);
-        }
-        return {
-            pageId,
-            table: tableRef,
-            rows: t.rows,
-            cols: t.cols,
-            path: t.path,
-            cells: t.cells,
-            cellIds: t.cellIds,
-        };
-    }
-    /**
-     * Insert a row of plain-text cells into a table on the LIVE collab document.
-     * `tableRef` is `#<index>` or a block id inside the target table. `cells` is
-     * padded to the table's column count (more cells than columns throws); `index`
-     * is a 0-based insert position (omit/out-of-range to append). Throws when no
-     * table resolves for the reference.
-     */
-    async tableInsertRow(pageId, tableRef, cells, index) {
-        await this.ensureAuthenticated();
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the collab doc by the canonical UUID, never the slugId (#260).
-        const pageUuid = await this.resolvePageId(pageId);
-        // Track insertion in an outer var, reset per-transform, so a collab retry
-        // recomputes it cleanly (mirrors insertNode's pattern).
-        let inserted = false;
-        const mutation = await mutatePageContent(pageUuid, collabToken, this.apiUrl, (liveDoc) => {
-            inserted = false;
-            const { doc: nd, inserted: ins } = insertTableRow(liveDoc, tableRef, cells, index);
-            inserted = ins;
-            if (!inserted)
-                return null; // table not found -> skip the write entirely
-            return nd;
-        });
-        if (!inserted) {
-            throw new Error(`table_insert_row: no table found for "${tableRef}" on page ${pageId} (use "#<index>" from get_outline, or a block id inside the table)`);
-        }
-        return {
-            success: true,
-            table: tableRef,
-            inserted: true,
-            verify: mutation.verify,
-        };
-    }
-    /**
-     * Delete the row at 0-based `index` from a table on the LIVE collab document.
-     * `tableRef` is `#<index>` or a block id inside the target table. The helper's
-     * out-of-range and last-row errors propagate; a missing table throws here.
-     */
-    async tableDeleteRow(pageId, tableRef, index) {
-        await this.ensureAuthenticated();
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the collab doc by the canonical UUID, never the slugId (#260).
-        const pageUuid = await this.resolvePageId(pageId);
-        let deleted = false;
-        const mutation = await mutatePageContent(pageUuid, collabToken, this.apiUrl, (liveDoc) => {
-            deleted = false;
-            const { doc: nd, deleted: del } = deleteTableRow(liveDoc, tableRef, index);
-            deleted = del;
-            if (!deleted)
-                return null; // table not found -> skip the write entirely
-            return nd;
-        });
-        if (!deleted) {
-            throw new Error(`table_delete_row: no table found for "${tableRef}" on page ${pageId} (use "#<index>" from get_outline, or a block id inside the table)`);
-        }
-        return {
-            success: true,
-            table: tableRef,
-            deleted: true,
-            verify: mutation.verify,
-        };
-    }
-    /**
-     * Set the plain-text content of cell `[row, col]` (0-based) in a table on the
-     * LIVE collab document, replacing the cell's content with a single text
-     * paragraph (the cell's first-paragraph id is preserved). `tableRef` is
-     * `#<index>` or a block id inside the target table. The helper's out-of-range
-     * error propagates; a missing table throws here.
-     */
-    async tableUpdateCell(pageId, tableRef, row, col, text) {
-        await this.ensureAuthenticated();
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the collab doc by the canonical UUID, never the slugId (#260).
-        const pageUuid = await this.resolvePageId(pageId);
-        let updated = false;
-        const mutation = await mutatePageContent(pageUuid, collabToken, this.apiUrl, (liveDoc) => {
-            updated = false;
-            const { doc: nd, updated: upd } = updateTableCell(liveDoc, tableRef, row, col, text);
-            updated = upd;
-            if (!updated)
-                return null; // table not found -> skip the write entirely
-            return nd;
-        });
-        if (!updated) {
-            throw new Error(`table_update_cell: no table found for "${tableRef}" on page ${pageId} (use "#<index>" from get_outline, or a block id inside the table)`);
-        }
-        return {
-            success: true,
-            table: tableRef,
-            row,
-            col,
-            verify: mutation.verify,
-        };
-    }
-    /**
-     * Create a new page with title and content.
-     * Uses the /pages/import workaround (the only endpoint accepting content),
-     * then moves the page and restores the exact title: the import endpoint
-     * derives the title from the FILENAME and replaces spaces with
-     * underscores, so we explicitly re-set it via /pages/update afterwards.
-     */
-    async createPage(title, content, spaceId, parentPageId) {
-        await this.ensureAuthenticated();
-        if (parentPageId) {
-            try {
-                await this.getPage(parentPageId);
-            }
-            catch (e) {
-                throw new Error(`Parent page with ID ${parentPageId} not found.`);
-            }
-        }
-        // 1. Create content via Import (using multipart/form-data).
-        // Build a FRESH FormData per send attempt: a FormData body is a single-use
-        // stream consumed on the first send, so it cannot be replayed by
-        // this.client's response interceptor (replay fails with 'socket hang up').
-        // Multipart re-auth is therefore done here with bare axios and an explicit
-        // one-shot 401/403 retry that rebuilds the body.
-        const fileContent = Buffer.from(content, "utf-8");
-        const buildForm = () => {
-            const form = new FormData();
-            form.append("spaceId", spaceId);
-            form.append("file", fileContent, {
-                filename: `${title || "import"}.md`,
-                contentType: "text/markdown",
-            });
-            return form;
-        };
-        const importUrl = `${this.apiUrl}/pages/import`;
-        let response;
-        try {
-            // Call buildForm() ONCE per attempt and reuse the instance for both
-            // getHeaders() and the body so the Content-Type boundary matches the body.
-            const form = buildForm();
-            // Read the Authorization header from this.client's defaults (set by
-            // login(), only ever deleted — never set to null) instead of building
-            // `Bearer ${this.token}`: a concurrent JSON 401 can null this.token
-            // mid-flight, which would otherwise produce a literal "Bearer null".
-            // ensureAuthenticated() above guarantees login() ran, so the default
-            // header exists here.
-            response = await axios.post(importUrl, form, {
-                headers: {
-                    ...form.getHeaders(),
-                    Authorization: this.client.defaults.headers.common["Authorization"],
-                },
-                timeout: 60000,
-            });
-        }
-        catch (error) {
-            // On an expired-token auth error, re-login and retry exactly once with a
-            // freshly-rebuilt FormData (the previous one was already consumed).
-            if (axios.isAxiosError(error) &&
-                (error.response?.status === 401 || error.response?.status === 403)) {
-                await this.login();
-                const form2 = buildForm();
-                response = await axios.post(importUrl, form2, {
-                    headers: {
-                        ...form2.getHeaders(),
-                        Authorization: this.client.defaults.headers.common["Authorization"],
-                    },
-                    timeout: 60000,
-                });
-            }
-            else {
-                throw error;
-            }
-        }
-        const newPageId = (response.data?.data ?? response.data).id;
-        // 2. Move to parent if needed
-        if (parentPageId) {
-            await this.movePage(newPageId, parentPageId);
-        }
-        // 3. Restore the exact title (import mangles spaces into underscores)
-        if (title) {
-            await this.client.post("/pages/update", { pageId: newPageId, title });
-        }
-        const page = await this.getPage(newPageId);
-        // Surface non-fatal footnote problems (dangling refs, empty/duplicate
-        // definitions, markers in tables) so the agent can fix its markup (#166).
-        return { ...page, ...footnoteWarningsField(content) };
-    }
-    /**
-     * Update a page's content from markdown and optionally its title.
-     * NOTE: full re-import — block ids regenerate. For surgical changes
-     * use editPageText / updatePageJson instead.
-     */
-    async updatePage(pageId, content, title) {
-        await this.ensureAuthenticated();
-        // Open the collab doc by the canonical UUID, never the slugId (#260). The
-        // REST /pages/update title write below keeps the agent-supplied id (the
-        // server resolves a slugId there).
-        const pageUuid = await this.resolvePageId(pageId);
-        // Write the BODY first, then the title (#159 split-brain). If the collab
-        // body write fails (e.g. a persist timeout), the title must be left
-        // UNTOUCHED so the page never ends up with a new title over its old body.
-        // A title write failing AFTER a successful body is rarer (REST is fast) and
-        // leaves correct content under a stale title — the lesser inconsistency.
-        let collabToken = "";
-        let mutation;
-        try {
-            collabToken = await this.getCollabTokenWithReauth();
-            mutation = await updatePageContentRealtime(pageUuid, content, collabToken, this.apiUrl);
-        }
-        catch (error) {
-            // Verbose diagnostics (incl. anything that could expose a token prefix)
-            // are gated behind DEBUG; the thrown Error below carries no token data.
-            if (process.env.DEBUG) {
-                console.error("Failed to update page content via realtime collaboration:", error);
-                const tokenPreview = collabToken
-                    ? collabToken.substring(0, 15) + "..."
-                    : "null";
-                console.error(`Collab token preview: ${tokenPreview}`);
-            }
-            throw new Error(`Failed to update page content: ${error.message}`);
-        }
-        // Body persisted successfully — now it is safe to set the title.
-        if (title) {
-            await this.client.post("/pages/update", { pageId, title });
-        }
-        return {
-            success: true,
-            modified: true,
-            message: "Page updated successfully.",
-            pageId: pageId,
-            verify: mutation.verify,
-            // Non-fatal footnote diagnostics (#166); omitted when there are none.
-            ...footnoteWarningsField(content),
-        };
-    }
-    /**
-     * Validate a URL string against a scheme allowlist for a given context.
-     *
-     * The markdown link path enforces safe schemes via TipTap, but the raw
-     * JSON path (updatePageJson) bypasses that — so this is the sanitization
-     * choke point for ProseMirror JSON written directly by the caller.
-     *
-     * - "link":  reject javascript:, vbscript:, data: (any scheme that can
-     *            execute or smuggle script when the href is clicked).
-     * - "src":   allow only http(s):, mailto:, /api/files paths, or a
-     *            scheme-less relative/absolute path; reject
-     *            javascript:/vbscript:/data:/file:.
-     */
-    isSafeUrl(url, context) {
-        if (typeof url !== "string")
-            return false;
-        const trimmed = url.trim();
-        if (trimmed === "")
-            return true; // empty href/src is harmless
-        // Extract a leading "scheme:" if present. A scheme must start with a
-        // letter and contain only letters/digits/+/-/. before the colon. Strip
-        // whitespace and ASCII control chars first so a tab/newline embedded in
-        // the scheme cannot smuggle a dangerous scheme past the check.
-        const cleaned = trimmed.replace(/[\s\x00-\x1f]+/g, "");
-        const schemeMatch = /^([a-zA-Z][a-zA-Z0-9+.-]*):/.exec(cleaned);
-        const scheme = schemeMatch ? schemeMatch[1].toLowerCase() : null;
-        const dangerous = new Set(["javascript", "vbscript", "data", "file"]);
-        if (context === "link") {
-            if (scheme === null)
-                return true; // relative/anchor link is fine
-            // For links, data: is also blocked (can carry script payloads).
-            return !new Set(["javascript", "vbscript", "data"]).has(scheme);
-        }
-        // context === "src"
-        if (scheme === null)
-            return true; // relative/absolute path (incl. /api/files)
-        if (dangerous.has(scheme))
-            return false;
-        return scheme === "http" || scheme === "https" || scheme === "mailto";
-    }
-    /**
-     * Recursively walk a ProseMirror doc and reject any unsafe URL on a link
-     * mark href or on a media node's src/url. Media nodes covered: image,
-     * attachment, video, plus embed (rendered as an iframe), youtube, drawio
-     * and excalidraw — all of which carry a user-controlled URL that Docmost
-     * renders. Throws a clear error on the first violation. A max-depth guard
-     * turns an over-deep document into a clean error instead of a RangeError
-     * stack overflow.
-     */
-    validateDocUrls(node, depth = 0) {
-        const MAX_DEPTH = 200;
-        if (depth > MAX_DEPTH) {
-            throw new Error(`document nesting exceeds the maximum depth of ${MAX_DEPTH}`);
-        }
-        if (!node || typeof node !== "object")
-            return;
-        // Link marks on text nodes: validate the href.
-        if (Array.isArray(node.marks)) {
-            for (const mark of node.marks) {
-                if (mark && mark.type === "link" && mark.attrs) {
-                    if (!this.isSafeUrl(mark.attrs.href, "link")) {
-                        throw new Error(`unsafe link href rejected: "${mark.attrs.href}"`);
-                    }
-                }
-            }
-        }
-        // Media nodes: validate src/url against the stricter src allowlist.
-        // embed renders as an iframe (highest risk); youtube/drawio/excalidraw
-        // likewise carry a user-controlled URL Docmost renders, so they get the
-        // same scheme check as image/attachment/video.
-        if (node.type === "image" ||
-            node.type === "attachment" ||
-            node.type === "video" ||
-            node.type === "embed" ||
-            node.type === "youtube" ||
-            node.type === "drawio" ||
-            node.type === "excalidraw" ||
-            node.type === "audio" ||
-            node.type === "pdf") {
-            const attrs = node.attrs || {};
-            for (const key of ["src", "url"]) {
-                if (attrs[key] != null && !this.isSafeUrl(attrs[key], "src")) {
-                    throw new Error(`unsafe ${node.type} ${key} rejected: "${attrs[key]}"`);
-                }
-            }
-        }
-        if (Array.isArray(node.content)) {
-            for (const child of node.content) {
-                this.validateDocUrls(child, depth + 1);
-            }
-        }
-    }
-    /**
-     * Recursively validate the STRUCTURE of a ProseMirror node (reuses the
-     * recursion shape of validateDocUrls). Every node must be an object with a
-     * string `type`; when present, `content` must be an array, `marks` must be
-     * an array of objects each with a string `type`, and a text node's `text`
-     * must be a string. Throws a clear "invalid ProseMirror document" error on
-     * the first violation. A max-depth guard turns an over-deep document into a
-     * clean error instead of a RangeError stack overflow.
-     */
-    validateDocStructure(node, depth = 0) {
-        const MAX_DEPTH = 200;
-        if (depth > MAX_DEPTH) {
-            throw new Error(`invalid ProseMirror document: nesting exceeds the maximum depth of ${MAX_DEPTH}`);
-        }
-        if (!node || typeof node !== "object" || typeof node.type !== "string") {
-            throw new Error("invalid ProseMirror document: every node must be an object with a string `type`");
-        }
-        if ("text" in node &&
-            node.type === "text" &&
-            typeof node.text !== "string") {
-            throw new Error("invalid ProseMirror document: a text node must have a string `text`");
-        }
-        if (node.marks !== undefined) {
-            if (!Array.isArray(node.marks)) {
-                throw new Error("invalid ProseMirror document: `marks` must be an array");
-            }
-            for (const mark of node.marks) {
-                if (!mark ||
-                    typeof mark !== "object" ||
-                    typeof mark.type !== "string") {
-                    throw new Error("invalid ProseMirror document: every mark must be an object with a string `type`");
-                }
-            }
-        }
-        if (node.content !== undefined) {
-            if (!Array.isArray(node.content)) {
-                throw new Error("invalid ProseMirror document: `content` must be an array when present");
-            }
-            for (const child of node.content) {
-                this.validateDocStructure(child, depth + 1);
-            }
-        }
-    }
-    /**
-     * Replace page content with a raw ProseMirror JSON document (lossless) and/or
-     * update its title. Both `doc` and `title` are optional, but at least one must
-     * be supplied:
-     *  - `doc` provided   -> validate + full-overwrite the body (and update the
-     *                        title too when `title` is also given).
-     *  - `doc` omitted, `title` given -> title-only update; the body is NOT
-     *                        touched/resent (no collab write happens).
-     *  - neither given    -> throws (nothing to update).
-     */
-    async updatePageJson(pageId, doc, title) {
-        await this.ensureAuthenticated();
-        // Title-only / no-op handling: when no document is supplied, do NOT write
-        // the body. Update the title if one was given; otherwise there is nothing
-        // to do, so fail loudly rather than silently no-op.
-        if (doc == null) {
-            if (!title) {
-                throw new Error("update_page_json: nothing to update (provide content and/or title)");
-            }
-            await this.client.post("/pages/update", { pageId, title });
-            return {
-                success: true,
-                modified: true,
-                message: "Page title updated (content left unchanged).",
-                pageId,
-            };
-        }
-        // Validate the document shape before a full overwrite: a malformed doc
-        // would otherwise silently corrupt the page (full-overwrite is the
-        // documented behaviour; no optimistic-concurrency is applied here).
-        if (typeof doc !== "object" ||
-            doc.type !== "doc" ||
-            !Array.isArray(doc.content)) {
-            throw new Error('content must be a ProseMirror document ({"type":"doc","content":[...]}) ' +
-                "where content is an array of nodes each having a string `type`");
-        }
-        // Recurse the WHOLE document so a malformed nested node (e.g. a node with a
-        // non-string type, a non-array content/marks, or a text node missing its
-        // string text) is rejected up front rather than silently corrupting the
-        // page on overwrite.
-        this.validateDocStructure(doc);
-        // Sanitize URLs before writing. This closes the JSON-path bypass: unlike
-        // the markdown link path (which TipTap sanitizes), raw JSON could otherwise
-        // inject javascript:/data: link hrefs or media srcs straight into the doc.
-        this.validateDocUrls(doc);
-        // Canonicalize footnotes (idempotent): an agent-authored JSON doc cannot
-        // leave footnotes out of order, orphaned, or in multiple lists — the bottom
-        // list + numbering are always derived from reference order. No-op when the
-        // footnotes are already canonical.
-        doc = canonicalizeFootnotes(doc);
-        // Write the BODY first, then the title (#159 split-brain): a failed body
-        // write (e.g. persist timeout) must not leave a new title over the old body.
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the collab doc by the canonical UUID, never the slugId (#260).
-        const pageUuid = await this.resolvePageId(pageId);
-        const mutation = await this.replacePage(pageUuid, doc, collabToken, this.apiUrl);
-        // Body persisted successfully — now it is safe to set the title.
-        if (title) {
-            await this.client.post("/pages/update", { pageId, title });
-        }
-        return {
-            success: true,
-            modified: true,
-            message: "Page content replaced from ProseMirror JSON.",
-            pageId,
-            verify: mutation.verify,
-        };
-    }
-    /**
-     * AUTHOR-INLINE footnote insertion. The agent supplies only WHERE
-     * (`anchorText`, a snippet of body text to attach the marker after) and WHAT
-     * (`text`, the footnote content as markdown). Numbering and the bottom
-     * `footnotesList` are derived deterministically server-side
-     * (`insertInlineFootnote` -> `canonicalizeFootnotes`): the agent never sees,
-     * assigns, or edits a footnote number or the list, so it CANNOT desync.
-     *
-     * Content DEDUP: when an existing definition has the same content, its id is
-     * reused (one number, one definition, several references). The write is atomic
-     * via `mutatePageContent` (single-writer, page-locked); if the anchor text is
-     * not found the transform aborts with a clear error and no write happens.
-     */
-    async insertFootnote(pageId, anchorText, text) {
-        await this.ensureAuthenticated();
-        if (!anchorText || !anchorText.trim()) {
-            throw new Error("insert_footnote: anchorText is required");
-        }
-        if (text == null || `${text}`.trim() === "") {
-            throw new Error("insert_footnote: text is required");
-        }
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the collab doc by the canonical UUID, never the slugId (#260).
-        const pageUuid = await this.resolvePageId(pageId);
-        let result = null;
-        const mutation = await this.mutatePage(pageUuid, collabToken, this.apiUrl, (liveDoc) => {
-            const r = insertInlineFootnote(liveDoc, { anchorText, text });
-            if (!r.inserted) {
-                // Abort the page-locked write by throwing: mutatePageContent does not
-                // persist when the transform throws, so a missing anchor leaves the
-                // page untouched (no partial write).
-                throw new Error(`insert_footnote: anchor text not found: ${JSON.stringify(anchorText.slice(0, 80))}`);
-            }
-            result = { footnoteId: r.footnoteId, reused: r.reused };
-            return r.doc;
-        });
-        // The not-found path throws inside the transform (aborting mutatePage), so by
-        // here `result` is always set.
-        const r = result;
-        return {
-            success: true,
-            modified: true,
-            pageId,
-            footnoteId: r.footnoteId,
-            reused: r.reused,
-            message: r.reused
-                ? "Footnote inserted (reused an existing same-content definition)."
-                : "Footnote inserted.",
-            verify: mutation.verify,
-        };
-    }
-    /**
-     * Page-locked write seam over collaboration.mutatePageContent. Production just
-     * delegates; it exists as an overridable method so the insert_footnote wrapper
-     * (transform abort-on-not-found + response shaping) can be unit-tested without
-     * standing up a live Hocuspocus collab socket.
-     */
-    mutatePage(pageId, collabToken, apiUrl, transform) {
-        return mutatePageContent(pageId, collabToken, apiUrl, transform);
-    }
-    /**
-     * Full-document write seam over collaboration.replacePageContent. Production
-     * just delegates; it exists as an overridable method so the full-doc write
-     * tools (update_page_json, copy_page_content) can have their footnote-
-     * canonicalization binding unit-tested without a live Hocuspocus collab socket.
-     */
-    replacePage(pageId, doc, collabToken, apiUrl) {
-        return replacePageContent(pageId, doc, collabToken, apiUrl);
-    }
-    /**
-     * Export a page to a single self-contained Docmost-flavoured markdown file:
-     * meta block + body (with inline comment anchors + diagrams) + comment
-     * threads. Lossless round-trip target; see importPageMarkdown for the inverse.
-     */
-    async exportPageMarkdown(pageId) {
-        await this.ensureAuthenticated();
-        const page = await this.getPageRaw(pageId);
-        const body = page.content ? convertProseMirrorToMarkdown(page.content) : "";
-        let comments = [];
-        try {
-            comments = await this.listComments(pageId);
-        }
-        catch (e) {
-            // A comments fetch failure must not lose the body; export with [] and let
-            // the caller see the (empty) comments block. Log under DEBUG only.
-            if (process.env.DEBUG)
-                console.error("export: listComments failed", e);
-        }
-        const meta = {
-            version: 1,
-            pageId: page.id,
-            slugId: page.slugId,
-            title: page.title,
-            spaceId: page.spaceId,
-            parentPageId: page.parentPageId ?? null,
-        };
-        return serializeDocmostMarkdown(meta, body, comments);
-    }
-    /**
-     * Import a self-contained Docmost markdown file back into a page. Parses out
-     * the meta + comments metadata blocks, converts the body to ProseMirror
-     * (restoring comment marks + diagrams from their inline HTML), and replaces
-     * the page content. Comment THREAD records are NOT written to the server in
-     * this version — they are preserved in the file and the inline marks are
-     * re-applied so the highlights survive; managing comment records stays with
-     * the comment tools/UI.
-     */
-    async importPageMarkdown(pageId, fullMarkdown) {
-        await this.ensureAuthenticated();
-        const { meta, body, comments } = parseDocmostMarkdown(fullMarkdown);
-        // PAGE import: canonicalize footnotes (see markdownToProseMirrorCanonical).
-        const doc = await markdownToProseMirrorCanonical(body);
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the collab doc by the canonical UUID, never the slugId (#260).
-        const pageUuid = await this.resolvePageId(pageId);
-        const mutation = await replacePageContent(pageUuid, doc, collabToken, this.apiUrl);
-        // Collect distinct comment ids that actually became comment marks in the doc.
-        const collectCommentIds = (node, acc) => {
-            if (!node || typeof node !== "object")
-                return acc;
-            if (Array.isArray(node.marks)) {
-                for (const mk of node.marks) {
-                    if (mk && mk.type === "comment" && mk.attrs?.commentId) {
-                        acc.add(mk.attrs.commentId);
-                    }
-                }
-            }
-            if (Array.isArray(node.content)) {
-                for (const child of node.content)
-                    collectCommentIds(child, acc);
-            }
-            return acc;
-        };
-        // Count reflects the comment marks present in the written document, so an id
-        // that only appears as inert text (e.g. inside a fenced code block) is not
-        // counted because it never becomes a comment mark.
-        const anchoredIds = collectCommentIds(doc, new Set());
-        const result = {
-            success: true,
-            pageId,
-            anchoredCommentCount: anchoredIds.size,
-            commentsInFile: Array.isArray(comments) ? comments.length : 0,
-            verify: mutation.verify,
-        };
-        // Warn (non-fatal) if the file was exported from a DIFFERENT page.
-        if (meta?.pageId && meta.pageId !== pageId) {
-            result.warning = `File was exported from page ${meta.pageId} but is being imported into ${pageId}.`;
-        }
-        // Non-fatal footnote diagnostics (#166), analyzed on the BODY (the part after
-        // the docmost:meta / docmost:comments blocks) — so a `[^x]`-like token inside
-        // those JSON blocks never produces a false warning, while real markers in the
-        // body do. `body` comes from parseDocmostMarkdown(fullMarkdown) above.
-        Object.assign(result, footnoteWarningsField(body));
-        return result;
-    }
-    /**
-     * Rename a page (change its title only) without touching or resending its
-     * content. The slug is derived from the page record, not the body, so it is
-     * left intact too.
-     */
-    async renamePage(pageId, title) {
-        await this.ensureAuthenticated();
-        await this.client.post("/pages/update", { pageId, title });
-        return { success: true, pageId, title };
-    }
-    /**
-     * Copy the WHOLE content of one page onto another, entirely server-side: the
-     * source's ProseMirror document is read and written verbatim onto the target
-     * via the live collab path, so the document never passes through the model.
-     *
-     * Only the target's BODY is replaced — its title and slug live on the page
-     * record (not in the content), so they are untouched. The source page is not
-     * modified at all.
-     */
-    async copyPageContent(sourcePageId, targetPageId) {
-        await this.ensureAuthenticated();
-        // A self-copy would be a no-op overwrite; reject it explicitly so a caller
-        // mistake surfaces as a clear error rather than a silent round-trip.
-        if (sourcePageId === targetPageId) {
-            throw new Error("copy_page_content: sourcePageId and targetPageId are the same page (no-op copy)");
-        }
-        const source = await this.getPageRaw(sourcePageId);
-        const content = source?.content;
-        if (!content ||
-            typeof content !== "object" ||
-            content.type !== "doc" ||
-            !Array.isArray(content.content)) {
-            throw new Error(`copy_page_content: source page ${sourcePageId} has no usable ProseMirror content to copy`);
-        }
-        // Defense-in-depth: run the same URL-scheme sanitizer the JSON write path
-        // uses, so copying never lands a javascript:/data: href/src on the target
-        // (parity with updatePageJson; harmless for already-stored source content).
-        this.validateDocUrls(content);
-        // Defense-in-depth (#228): this is a FULL-document write, so canonicalize
-        // footnotes before copying — a no-op on already-canonical source content, but
-        // it guarantees a copy can never propagate a non-canonical footnote topology
-        // to the target (parity with the other full-doc write paths).
-        const canonical = canonicalizeFootnotes(content);
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the TARGET collab doc by its canonical UUID, never the slugId (#260).
-        const targetUuid = await this.resolvePageId(targetPageId);
-        const mutation = await this.replacePage(targetUuid, canonical, collabToken, this.apiUrl);
-        return {
-            success: true,
-            sourcePageId,
-            targetPageId,
-            copiedNodes: canonical.content.length,
-            verify: mutation.verify,
-        };
-    }
-    /**
-     * Surgical text edits: find/replace inside text nodes of the live
-     * document. Preserves all block ids, marks, callouts and tables.
-     */
-    async editPageText(pageId, edits) {
-        await this.ensureAuthenticated();
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the collab doc by the canonical UUID, never the slugId (#260).
-        const pageUuid = await this.resolvePageId(pageId);
-        // Apply the edits against the LIVE synced document, not the debounced REST
-        // snapshot, so concurrent human edits/comments are preserved. applyTextEdits
-        // records per-edit match problems in `failed` instead of throwing, and
-        // applies whatever it can; we abort the write only when nothing applied.
-        let results;
-        let failed;
-        // Whether we actually wrote new content. Set inside the transform: a
-        // degenerate edit (e.g. find === replace, or a batch that nets to no change)
-        // can "apply" yet leave the document byte-for-byte identical, in which case
-        // we must NOT write (no spurious history version) and must not claim a write
-        // happened.
-        let wrote = false;
-        const mutation = await mutatePageContent(pageUuid, collabToken, this.apiUrl, (liveDoc) => {
-            wrote = false;
-            const r = applyTextEdits(liveDoc, edits);
-            results = r.results;
-            failed = r.failed;
-            // Nothing applied -> abort the write (mutatePageContent treats a null
-            // return from the transform as "write nothing").
-            if (r.results.length === 0)
-                return null;
-            // Edits "applied" but produced an identical document: skip the write so
-            // no new history version is created. Stable structural comparison via
-            // JSON.stringify (both docs come from the same deep-copied source, so
-            // key order is stable).
-            if (JSON.stringify(r.doc) === JSON.stringify(liveDoc))
-                return null;
-            wrote = true;
-            return r.doc;
-        });
-        if ((results?.length ?? 0) === 0 && (failed?.length ?? 0) > 0) {
-            // No edit applied: surface an aggregated, actionable error so the caller
-            // does not mistake a no-op for a partial success.
-            throw new Error("edit_page_text: no edits were applied (nothing written). " +
-                failed.map((f) => `"${f.find}": ${f.reason}`).join("; "));
-        }
-        // Edits matched but produced no content change (identical document): report
-        // a successful no-op — NOT a failure — and do not falsely claim a write.
-        if (!wrote) {
-            return {
-                success: true,
-                pageId,
-                applied: results,
-                failed,
-                message: "No changes written (edits produced identical content).",
-                verify: mutation.verify,
-            };
-        }
-        const result = {
-            success: true,
-            pageId,
-            applied: results,
-            failed,
-            message: (failed?.length ?? 0)
-                ? `Applied ${results?.length ?? 0} edit(s); ${failed.length} failed (see failed[]). Node ids and formatting preserved.`
-                : "Text edits applied (node ids and formatting preserved).",
-            verify: mutation.verify,
-        };
-        // If any applied edit matched only after stripping markdown (the
-        // normalized fallback), warn that edit_page_text preserved existing marks
-        // and did NOT change formatting — so a caller who intended a formatting
-        // change is pointed at patch_node.
-        if (results?.some((r) => r.normalized === true)) {
-            result.warning =
-                "Some edits matched only after stripping markdown from your find string; " +
-                    "edit_page_text preserved existing marks (it did not change bold/strike/etc.). " +
-                    "If you intended a formatting change, use patch_node.";
-        }
-        return result;
-    }
-    /**
-     * Replace EVERY node whose attrs.id === nodeId (recursively, including nodes
-     * nested in callouts/tables) with the supplied node. Operates on the LIVE
-     * collab document so comments and concurrent edits are preserved.
-     *
-     * The replacement node's block id is preserved: if node.attrs is missing it
-     * is created, and if node.attrs.id is missing it is set to nodeId so the
-     * replacement keeps the same id it replaced. Throws if no node matches.
-     */
-    async patchNode(pageId, nodeId, node) {
-        await this.ensureAuthenticated();
-        if (!node || typeof node !== "object" || typeof node.type !== "string") {
-            throw new Error("patch_node: `node` must be an object with a string `type`");
-        }
-        // Preserve the block id WITHOUT mutating the caller's object: build a local
-        // copy whose attrs.id === nodeId (so the swapped-in node keeps the id of the
-        // node it replaces).
-        const target = {
-            ...node,
-            attrs: {
-                ...(node.attrs && typeof node.attrs === "object" ? node.attrs : {}),
-            },
-        };
-        if (target.attrs.id == null) {
-            target.attrs.id = nodeId;
-        }
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the collab doc by the canonical UUID, never the slugId (#260).
-        const pageUuid = await this.resolvePageId(pageId);
-        // Track the replacement count in an outer var, reset per-transform, so a
-        // collab retry recomputes it cleanly (mirrors replaceImage's pattern).
-        let replaced = 0;
-        const mutation = await mutatePageContent(pageUuid, collabToken, this.apiUrl, (liveDoc) => {
-            replaced = 0;
-            const { doc: nd, replaced: r } = replaceNodeById(liveDoc, nodeId, target);
-            replaced = r;
-            // 0 matches -> skip the write. >1 matches -> the id is AMBIGUOUS: Docmost
-            // duplicates block ids on copy/paste (and copyPageContent writes them
-            // verbatim), so replacing "the node with id X" would silently clobber
-            // EVERY duplicate (#159). Refuse: skip the write and throw below so the
-            // model re-targets with a more specific anchor instead of corrupting the
-            // page. Only an unambiguous single match is written.
-            if (replaced !== 1)
-                return null;
-            return nd;
-        });
-        // 0 -> "no node"; >1 -> "ambiguous, refused" (the transform already skipped
-        // the write for any count !== 1). Single shared guard (#159, #185 review).
-        assertUnambiguousMatch("patch_node", "replace", replaced, nodeId, pageId);
-        return { success: true, replaced, nodeId, verify: mutation.verify };
-    }
-    /**
-     * Insert a node relative to an anchor (or append it at the top level).
-     * Operates on the LIVE collab document so comments and concurrent edits are
-     * preserved.
-     *
-     * opts.position:
-     *  - "append": push the node at the end of the top-level content.
-     *  - "before"/"after": insert the node as a sibling of the anchor, just
-     *    before/after it. Exactly one of anchorNodeId / anchorText must be given;
-     *    anchorNodeId locates a node anywhere by attrs.id, anchorText matches the
-     *    first top-level block whose plain text includes it.
-     *
-     * Throws if the anchor cannot be found.
-     */
-    async insertNode(pageId, node, opts) {
-        await this.ensureAuthenticated();
-        if (!node || typeof node !== "object" || typeof node.type !== "string") {
-            throw new Error("insert_node: `node` must be an object with a string `type`");
-        }
-        if (!opts ||
-            (opts.position !== "before" &&
-                opts.position !== "after" &&
-                opts.position !== "append")) {
-            throw new Error('insert_node: `position` must be one of "before", "after", "append"');
-        }
-        if (opts.position === "before" || opts.position === "after") {
-            // before/after require EXACTLY ONE anchor (an id or a text fragment).
-            const hasId = typeof opts.anchorNodeId === "string" && opts.anchorNodeId.length > 0;
-            const hasText = typeof opts.anchorText === "string" && opts.anchorText.length > 0;
-            if (hasId === hasText) {
-                throw new Error(`insert_node: position "${opts.position}" requires exactly one of anchorNodeId or anchorText`);
-            }
-        }
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the collab doc by the canonical UUID, never the slugId (#260).
-        const pageUuid = await this.resolvePageId(pageId);
-        // Track insertion in an outer var, reset per-transform, so a collab retry
-        // recomputes it cleanly (mirrors replaceImage's pattern).
-        let inserted = false;
-        const mutation = await mutatePageContent(pageUuid, collabToken, this.apiUrl, (liveDoc) => {
-            inserted = false;
-            const { doc: nd, inserted: ins } = insertNodeRelative(liveDoc, node, opts);
-            inserted = ins;
-            if (!inserted)
-                return null; // anchor not found -> skip the write entirely
-            return nd;
-        });
-        if (!inserted) {
-            const anchorDesc = opts.anchorNodeId
-                ? `anchorNodeId "${opts.anchorNodeId}"`
-                : `anchorText "${opts.anchorText}"`;
-            // anchorText is matched against the block's literal RENDERED plain text;
-            // markdown/emoji are tolerated only as a strip-and-retry fallback, so a
-            // miss usually means the text differs from what's on the page.
-            const hint = opts.anchorText
-                ? " anchorText must be the block's literal rendered plain text (no markdown wrappers or emoji); anchorNodeId from get_page_json is more reliable."
-                : "";
-            throw new Error(`insert_node: anchor not found (${anchorDesc}) on page ${pageId}.${hint}`);
-        }
-        return {
-            success: true,
-            inserted: true,
-            position: opts.position,
-            verify: mutation.verify,
-        };
-    }
-    /**
-     * Remove EVERY node whose attrs.id === nodeId (recursively, including nodes
-     * nested in callouts/tables) from its parent content array. Operates on the
-     * LIVE collab document so comments and concurrent edits are preserved.
-     * Throws if no node matches.
-     */
-    async deleteNode(pageId, nodeId) {
-        await this.ensureAuthenticated();
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the collab doc by the canonical UUID, never the slugId (#260).
-        const pageUuid = await this.resolvePageId(pageId);
-        // Track the deletion count in an outer var, reset per-transform, so a
-        // collab retry recomputes it cleanly (mirrors replaceImage's pattern).
-        let deleted = 0;
-        const mutation = await mutatePageContent(pageUuid, collabToken, this.apiUrl, (liveDoc) => {
-            deleted = 0;
-            const { doc: nd, deleted: d } = deleteNodeById(liveDoc, nodeId);
-            deleted = d;
-            // 0 matches -> skip the write. >1 matches -> the id is AMBIGUOUS (block
-            // ids are duplicated on copy/paste, #159): deleting "the node with id X"
-            // would silently remove EVERY duplicate. Refuse: skip the write and throw
-            // below so the model re-targets. Only an unambiguous single match is
-            // deleted.
-            if (deleted !== 1)
-                return null;
-            return nd;
-        });
-        // 0 -> "no node"; >1 -> "ambiguous, refused" (the transform already skipped
-        // the write for any count !== 1). Single shared guard (#159, #185 review).
-        assertUnambiguousMatch("delete_node", "delete", deleted, nodeId, pageId);
-        return { success: true, deleted, nodeId, verify: mutation.verify };
-    }
-    /** Build the public share URL for a page. */
-    shareUrl(shareKey, slugId) {
-        return `${this.appUrl}/share/${shareKey}/p/${slugId}`;
-    }
-    /** Share a page publicly (idempotent) and return the public URL. */
-    async sharePage(pageId, searchIndexing = true) {
-        await this.ensureAuthenticated();
-        const response = await this.client.post("/shares/create", {
-            pageId,
-            includeSubPages: false,
-            searchIndexing,
-        });
-        const share = response.data?.data ?? response.data;
-        const slugId = share.page?.slugId || (await this.getPageRaw(pageId)).slugId;
-        return {
-            shareId: share.id,
-            key: share.key,
-            pageId: share.pageId,
-            publicUrl: this.shareUrl(share.key, slugId),
-            searchIndexing: share.searchIndexing,
-        };
-    }
-    /** List all public shares in the workspace with their URLs. */
-    async listShares() {
-        const shares = await this.paginateAll("/shares", {});
-        return shares.map((s) => ({
-            shareId: s.id,
-            key: s.key,
-            pageId: s.pageId,
-            pageTitle: s.page?.title,
-            publicUrl: s.page?.slugId ? this.shareUrl(s.key, s.page.slugId) : null,
-            searchIndexing: s.searchIndexing,
-            createdAt: s.createdAt,
-        }));
-    }
-    /** Remove the public share of a page. */
-    async unsharePage(pageId) {
-        await this.ensureAuthenticated();
-        const shares = await this.listShares();
-        const share = shares.find((s) => s.pageId === pageId);
-        if (!share) {
-            throw new Error(`Page ${pageId} is not shared.`);
-        }
-        await this.client.post("/shares/delete", { shareId: share.shareId });
-        return { success: true, removedShareId: share.shareId, pageId };
-    }
-    async search(query, spaceId, limit) {
-        await this.ensureAuthenticated();
-        const payload = { query, spaceId };
-        // Clamp an optional caller-supplied limit into a sane 1..100 range before
-        // forwarding it to the server; omit it entirely when not provided so the
-        // server applies its own default.
-        if (limit !== undefined) {
-            payload.limit = Math.max(1, Math.min(100, limit));
-        }
-        const response = await this.client.post("/search", payload);
-        // Normalize both response shapes: bare array and paginated { items: [...] }
-        const data = response.data?.data;
-        const items = Array.isArray(data) ? data : data?.items || [];
-        const filteredItems = items.map((item) => filterSearchResult(item));
-        return {
-            items: filteredItems,
-            success: response.data?.success || false,
-        };
-    }
-    async movePage(pageId, parentPageId, position) {
-        await this.ensureAuthenticated();
-        // Docmost requires position >= 5 chars.
-        const validPosition = position || "a00000";
-        return this.client
-            .post("/pages/move", {
-            pageId,
-            parentPageId,
-            position: validPosition,
-        })
-            .then((res) => res.data);
-    }
-    async deletePage(pageId) {
-        await this.ensureAuthenticated();
-        return this.client
-            .post("/pages/delete", { pageId })
-            .then((res) => res.data);
-    }
-    // --- Comment methods (ported from upstream PR #3 by Max Nikitin) ---
-    /**
-     * Normalize a comment's `content` into a ProseMirror doc object before
-     * markdown conversion. createComment/updateComment send content as a
-     * JSON.stringify(...) STRING, and the server stores it as-is, so on read it
-     * comes back as a string. convertProseMirrorToMarkdown returns "" for a
-     * string, so parse it first (guarded — fall back to the raw value on any
-     * parse failure so a non-JSON legacy value is still handled gracefully).
-     */
-    parseCommentContent(content) {
-        if (typeof content !== "string")
-            return content;
-        try {
-            return JSON.parse(content);
-        }
-        catch {
-            return content;
-        }
-    }
-    /** List all comments on a page (cursor-paginated), content as markdown. */
-    async listComments(pageId) {
-        await this.ensureAuthenticated();
-        let allComments = [];
-        let cursor = null;
-        do {
-            const payload = { pageId, limit: 100 };
-            if (cursor)
-                payload.cursor = cursor;
-            const response = await this.client.post("/comments", payload);
-            const data = response.data.data || response.data;
-            const items = data.items || [];
-            allComments = allComments.concat(items);
-            cursor = data.meta?.nextCursor || null;
-        } while (cursor);
-        return allComments.map((comment) => {
-            const markdown = comment.content
-                ? convertProseMirrorToMarkdown(this.parseCommentContent(comment.content))
-                : "";
-            return filterComment(comment, markdown);
-        });
-    }
-    async getComment(commentId) {
-        await this.ensureAuthenticated();
-        const response = await this.client.post("/comments/info", { commentId });
-        const comment = response.data.data || response.data;
-        const markdown = comment.content
-            ? convertProseMirrorToMarkdown(this.parseCommentContent(comment.content))
-            : "";
-        return {
-            data: filterComment(comment, markdown),
-            success: true,
-        };
-    }
-    /**
-     * Create an inline comment anchored to its `selection` text, or a reply.
-     *
-     * Top-level comments (no `parentCommentId`) are ALWAYS inline and MUST carry a
-     * `selection`: the `type` argument is kept for interface compatibility but the
-     * effective type is coerced to "inline". The selection has to anchor in the
-     * document; if it cannot, the comment is rolled back and an error is thrown so
-     * the caller is forced to supply a proper inline selection rather than leaving
-     * an orphan, unanchored comment behind. Replies (parentCommentId set) inherit
-     * their parent's anchor: they take NO selection and are not anchored.
-     */
-    async createComment(pageId, content, type = "page", selection, parentCommentId, suggestedText) {
-        await this.ensureAuthenticated();
-        const isReply = !!parentCommentId;
-        const hasSuggestion = suggestedText !== undefined && suggestedText !== null;
-        // Defense in depth mirroring the server DTO/service: a suggested edit rewrites
-        // the exact anchored text, so it is only meaningful on a top-level inline
-        // comment that carries a selection.
-        if (hasSuggestion) {
-            if (isReply) {
-                throw new Error("create_comment: a suggested edit (suggestedText) cannot be attached to a reply; it applies only to a top-level inline comment.");
-            }
-            if (!selection || !selection.trim()) {
-                throw new Error("create_comment: a suggested edit (suggestedText) requires a 'selection' to anchor and rewrite.");
-            }
-        }
-        // Only top-level comments are inline-anchored, so they are stored as
-        // "inline". Replies carry no inline selection, so they keep the historical
-        // general ("page") type — both backward-compatible and semantically correct.
-        // The `type` argument is kept for interface compatibility; createComment
-        // normalizes the effective type internally, so callers may pass "inline".
-        const effectiveType = isReply ? "page" : "inline";
-        if (!isReply && (!selection || !selection.trim())) {
-            throw new Error("create_comment: an inline 'selection' (exact text to anchor on) is required for a top-level comment");
-        }
-        // For a SUGGESTION, the value we store as the comment's `selection` must be
-        // the RAW document substring the mark lands on (typographic quotes/dashes,
-        // nbsp, collapsed whitespace), NOT the agent's ASCII input. The anchor is
-        // placed via normalization, so when the doc was auto-converted to
-        // typographic the raw substring differs from the agent input; apply-time
-        // compares the stored selection to the marked doc text STRICTLY, so storing
-        // the raw substring is what makes "Apply" succeed instead of a spurious 409.
-        // Captured in the pre-check below (which already reads the page) and used as
-        // payload.selection. Ordinary comments keep sending the raw agent selection.
-        let anchoredSelection = null;
-        // For a top-level comment, fail BEFORE creating anything when the selection
-        // is not present in the persisted document — this avoids leaving an orphan
-        // comment + notification behind. A read failure (network) is non-fatal: the
-        // live anchor step below still enforces the anchoring invariant.
-        if (!isReply && selection) {
-            try {
-                const page = await this.getPageJson(pageId);
-                if (hasSuggestion) {
-                    // A suggestion's anchor MUST be unambiguous: applying it rewrites the
-                    // exact anchored text, and ordinary anchoring silently takes the first
-                    // occurrence, so 0 matches -> not found and >=2 -> ambiguous, both
-                    // rejected BEFORE creating the comment.
-                    const matches = countAnchorMatches(page.content, selection);
-                    if (matches === 0) {
-                        throw new Error("create_comment: could not find the selection text in the page to anchor the comment. " +
-                            "Provide the EXACT contiguous text from a single paragraph/block (<=250 chars).");
-                    }
-                    if (matches >= 2) {
-                        throw new Error(`create_comment: the suggestion's selection is ambiguous — it occurs ${matches} times in the page. ` +
-                            "A suggested edit must anchor to a UNIQUE location; expand the selection with surrounding context " +
-                            "(still <=250 chars) so it appears exactly once.");
-                    }
-                    // Exactly one match: capture the RAW anchored substring to store as the
-                    // comment selection (so apply-time equality holds). If this returns
-                    // null despite countAnchorMatches===1 (shouldn't happen), fall back to
-                    // the raw agent selection below rather than crash.
-                    anchoredSelection = getAnchoredText(page.content, selection);
-                }
-                else if (!canAnchorInDoc(page.content, selection)) {
-                    throw new Error("create_comment: could not find the selection text in the page to anchor the comment. " +
-                        "Provide the EXACT contiguous text from a single paragraph/block (<=250 chars).");
-                }
-            }
-            catch (e) {
-                // Rethrow our own "not found"/"ambiguous" errors; swallow read/network
-                // errors so the live anchor step can still try (and enforce) anchoring.
-                if (e instanceof Error &&
-                    (e.message.startsWith("create_comment: could not find the selection") ||
-                        e.message.startsWith("create_comment: the suggestion's selection is ambiguous"))) {
-                    throw e;
-                }
-                if (process.env.DEBUG) {
-                    console.error("Pre-check getPageJson failed; deferring to live anchor step:", e);
-                }
-            }
-        }
-        // Convert through the full Docmost schema. Deliberately the NON-canonicalizing
-        // variant: a comment body may carry a footnote definition with no matching
-        // reference, and canonicalization would drop it (data loss). See
-        // markdownToProseMirror vs markdownToProseMirrorCanonical.
-        const jsonContent = await markdownToProseMirror(content);
-        const payload = {
-            pageId,
-            content: JSON.stringify(jsonContent),
-            type: effectiveType,
-        };
-        // For a suggestion, store the RAW anchored substring (anchoredSelection) so
-        // the stored selection === the text under the mark === apply-time
-        // expectedText. Ordinary comments (and the null fallback) keep the raw
-        // agent selection — their selection is only display/anchor and never used
-        // by apply, so their behavior is unchanged.
-        if (!isReply && selection)
-            payload.selection = anchoredSelection ?? selection;
-        if (parentCommentId)
-            payload.parentCommentId = parentCommentId;
-        // Only a top-level inline comment (with a selection) may carry a suggestion.
-        if (!isReply && selection && hasSuggestion) {
-            payload.suggestedText = suggestedText;
-        }
-        const response = await this.client.post("/comments/create", payload);
-        const comment = response.data.data || response.data;
-        const markdown = comment.content
-            ? convertProseMirrorToMarkdown(this.parseCommentContent(comment.content))
-            : content;
-        const result = {
-            data: filterComment(comment, markdown),
-            success: true,
-        };
-        // Replies inherit the parent's anchor: no selection, no anchoring.
-        if (isReply) {
-            return result;
-        }
-        // Anchor the comment in the document. The /comments/create API records the
-        // comment + its `selection` text, but it does NOT insert the comment MARK
-        // into the page content, so without this the inline comment has no
-        // highlight/anchor and is not clickable. If anchoring fails the comment is
-        // rolled back (deleted) and an error is thrown — never an orphan comment.
-        const newCommentId = comment.id;
-        // Guard: a create response without an id would mean writing a comment mark
-        // with commentId: undefined and a later delete of a falsy id. We have no id
-        // to roll back here (nothing was created with an id), so just fail loudly.
-        if (!newCommentId) {
-            throw new Error("create_comment: the server returned no comment id, so the comment could not be anchored");
-        }
-        let anchored = false;
-        // Set inside the transform when a suggestion's live anchor is ambiguous
-        // (>=2 occurrences), so the rollback path can surface the right error.
-        let ambiguousInLiveDoc = false;
-        try {
-            const collabToken = await this.getCollabTokenWithReauth();
-            // Open the collab doc by the canonical UUID, never the slugId (#260). The
-            // /comments/create REST call above keeps the agent-supplied id.
-            const pageUuid = await this.resolvePageId(pageId);
-            // Route through the mutatePage seam (not the free function) so this
-            // wrapper's uniqueness gate + rollback can be unit-tested without a live
-            // Hocuspocus collab socket.
-            const mutation = await this.mutatePage(pageUuid, collabToken, this.apiUrl, (liveDoc) => {
-                const doc = liveDoc && liveDoc.type === "doc"
-                    ? liveDoc
-                    : { type: "doc", content: [] };
-                if (hasSuggestion) {
-                    // Authoritative uniqueness check against the LIVE document: a
-                    // suggestion must anchor to EXACTLY ONE occurrence, otherwise
-                    // "Apply" would rewrite the wrong/ambiguous text. If the live doc
-                    // no longer has exactly one occurrence (it changed since the
-                    // pre-check), abort so the just-created comment is rolled back
-                    // rather than mis-anchored to the first occurrence.
-                    const liveCount = countAnchorMatches(doc, selection);
-                    if (liveCount !== 1) {
-                        ambiguousInLiveDoc = liveCount >= 2;
-                        return null;
-                    }
-                }
-                if (applyAnchorInDoc(doc, selection, newCommentId)) {
-                    anchored = true;
-                    return doc;
-                }
-                // Selection text not found in the LIVE document: abort the write. The
-                // rollback + throw below turns this into a hard error.
-                return null;
-            });
-            result.verify = mutation.verify;
-        }
-        catch (e) {
-            // The comment record already exists; roll it back so we never leave an
-            // orphan, then rethrow the original anchoring error.
-            await this.safeDeleteComment(newCommentId);
-            throw e;
-        }
-        if (!anchored) {
-            // Mutation aborted because the selection was not found (or, for a
-            // suggestion, was ambiguous) in the live document. Roll back the comment
-            // and surface a hard error.
-            await this.safeDeleteComment(newCommentId);
-            throw new Error(ambiguousInLiveDoc
-                ? "create_comment: the suggestion's selection is ambiguous in the live document (multiple occurrences); the comment was rolled back. Expand the selection with surrounding context so it is unique."
-                : "create_comment: failed to anchor the comment (selection not found in the live document); the comment was rolled back");
-        }
-        result.anchored = true;
-        return result;
-    }
-    /**
-     * Best-effort rollback of a just-created comment. Swallows any delete failure
-     * (logging under DEBUG) so a failed cleanup never masks the original error.
-     */
-    async safeDeleteComment(commentId) {
-        // Defense in depth: never call the delete API with a falsy id — there is
-        // nothing to roll back, and deleteComment(undefined) would hit a bad route.
-        if (!commentId)
-            return;
-        try {
-            await this.deleteComment(commentId);
-        }
-        catch (delErr) {
-            if (process.env.DEBUG) {
-                console.error("Failed to roll back comment after anchoring error:", delErr);
-            }
-        }
-    }
-    async updateComment(commentId, content) {
-        await this.ensureAuthenticated();
-        // NON-canonicalizing on purpose (comment body — see createComment).
-        const jsonContent = await markdownToProseMirror(content);
-        await this.client.post("/comments/update", {
-            commentId,
-            content: JSON.stringify(jsonContent),
-        });
-        return {
-            success: true,
-            commentId,
-            message: "Comment updated successfully.",
-        };
-    }
-    async deleteComment(commentId) {
-        await this.ensureAuthenticated();
-        return this.client
-            .post("/comments/delete", { commentId })
-            .then((res) => res.data);
-    }
-    /**
-     * Resolve or reopen a top-level comment thread (reversible — `resolved`
-     * toggles the state). Only top-level comments can be resolved; the server
-     * rejects resolving a reply. Hits POST /comments/resolve.
-     */
-    async resolveComment(commentId, resolved) {
-        await this.ensureAuthenticated();
-        const response = await this.client.post("/comments/resolve", {
-            commentId,
-            resolved,
-        });
-        const comment = response.data?.data ?? response.data;
-        return {
-            success: true,
-            commentId,
-            resolved,
-            comment,
-        };
-    }
-    /**
-     * Check for new comments across pages in a space (optionally scoped to a
-     * subtree): pages updated after `since` are scanned and their comments
-     * filtered by createdAt > since.
-     */
-    async checkNewComments(spaceId, since, parentPageId) {
-        await this.ensureAuthenticated();
-        const sinceDate = new Date(since);
-        // Reject an unparseable `since`: comparing against an Invalid Date silently
-        // yields zero new comments (every `>` against NaN is false), which would
-        // mask a malformed input as "nothing new" instead of erroring.
-        if (Number.isNaN(sinceDate.getTime())) {
-            throw new Error(`checkNewComments: invalid "since" date "${since}"; expected an ISO-8601 timestamp`);
-        }
-        // 1. Enumerate the FULL set of pages in scope by walking the sidebar-pages
-        // tree (a complete page index), NOT the bounded "/pages/recent" feed which
-        // caps at ~5000 recent items and silently misses comments on older pages.
-        //
-        // Subtree scope: when parentPageId is given, the scope is that page ITSELF
-        // plus every descendant (enumerateSpacePages walks its children). Otherwise
-        // the scope is the whole space (all roots and their descendants).
-        //
-        // NOTE: do NOT pre-filter by page.updatedAt — creating a comment does not
-        // bump it (verified on a live server), so such a filter silently misses
-        // comments on pages that were not otherwise edited. The complete tree walk
-        // already restricts the scope correctly, so no recent-feed allow-list is
-        // needed any more.
-        let pagesInScope;
-        if (parentPageId) {
-            const subtree = await this.enumerateSpacePages(spaceId, parentPageId);
-            // Include the parent page node itself alongside its descendants. Fetch it
-            // so its title/id are available even though it is not returned by its own
-            // children listing.
-            let parentNode = { id: parentPageId };
-            try {
-                parentNode = await this.getPageRaw(parentPageId);
-            }
-            catch (e) {
-                // Fall back to a minimal node if the parent can't be fetched; its
-                // comments are still attempted below (the fetch there is non-fatal).
-            }
-            pagesInScope = [parentNode, ...subtree];
-        }
-        else {
-            pagesInScope = await this.enumerateSpacePages(spaceId);
-        }
-        // 2. Fetch comments for each page, keep ones created after since
-        const results = [];
-        for (const page of pagesInScope) {
-            try {
-                const comments = await this.listComments(page.id);
-                const newComments = comments.filter((c) => new Date(c.createdAt) > sinceDate);
-                if (newComments.length > 0) {
-                    results.push({
-                        pageId: page.id,
-                        pageTitle: page.title,
-                        comments: newComments,
-                    });
-                }
-            }
-            catch (e) {
-                // Skip pages with errors (e.g. deleted between calls)
-            }
-        }
-        const totalNewComments = results.reduce((sum, r) => sum + r.comments.length, 0);
-        // enumerateSpacePages caps traversal at 10000 nodes; flag when that cap was
-        // hit so the caller knows the scan may be incomplete (some pages skipped).
-        const truncated = pagesInScope.length >= 10000;
-        return {
-            since,
-            scope: parentPageId ? `subtree of ${parentPageId}` : `space ${spaceId}`,
-            checkedPages: pagesInScope.length,
-            pagesWithNewComments: results.length,
-            totalNewComments,
-            truncated,
-            comments: results,
-        };
-    }
-    // --- Image upload / embedding ---
-    /** Map a Content-Type string to a supported MIME type, or null if unsupported. */
-    supportedImageMime(ct) {
-        return MIME_TO_EXT[ct] ? ct : null;
-    }
-    /**
-     * Download a remote image from a caller-supplied URL and resolve its bytes,
-     * MIME and a filename.
-     *
-     * SSRF / RESOURCE TRUST BOUNDARY: the URL comes from the MCP caller and is
-     * fetched BY THE SERVER, so it must be guarded before and after the request.
-     * The guards mirror the local-file trust boundary in uploadImage:
-     *   - scheme allowlist (http/https only) — rejects file:, data:, ftp:, etc.,
-     *     so the caller cannot use this path to read local files or other schemes;
-     *   - a size cap enforced both via axios maxContentLength/maxBodyLength AND a
-     *     post-download buffer.length re-check (defends against a missing/lying
-     *     Content-Length), so a huge response cannot exhaust memory;
-     *   - a 30s timeout. The timeout matters because replaceImage holds the
-     *     per-page lock across this upload, so a hung download would wedge the
-     *     lock for that page.
-     * We deliberately do NOT block private IP ranges: the MCP caller is already
-     * trusted to read arbitrary host files via the filePath path, so the marginal
-     * trust granted by fetching internal URLs is comparable, and blocking would
-     * break legitimate internal-image use.
-     */
-    async fetchRemoteImage(url, maxBytes) {
-        // Scheme allowlist first — cheapest guard, and rejects non-http(s) schemes
-        // (file:, data:, ftp:, ...) before any network request is made.
-        let parsed;
-        try {
-            parsed = new URL(url);
-        }
-        catch (e) {
-            throw new Error(`Invalid image URL "${url}": ${e.message}`);
-        }
-        if (parsed.protocol !== "http:" && parsed.protocol !== "https:") {
-            throw new Error(`unsupported image URL scheme "${parsed.protocol}"; only http and https are allowed`);
-        }
-        let response;
-        try {
-            response = await axios.get(url, {
-                responseType: "arraybuffer",
-                timeout: 30000,
-                maxContentLength: maxBytes,
-                maxBodyLength: maxBytes,
-                headers: { Accept: "image/*" },
-            });
-        }
-        catch (error) {
-            // Keep the thrown message free of the raw response body (it may echo
-            // server internals); surface only status/statusText. The full body is
-            // logged under DEBUG for diagnostics.
-            if (axios.isAxiosError(error)) {
-                if (process.env.DEBUG) {
-                    console.error("Image download failed; response body:", JSON.stringify(error.response?.data));
-                }
-                throw new Error(`Image download failed for "${url}": ${error.response?.status ?? ""} ${error.response?.statusText ?? error.message}`.trim());
-            }
-            throw error;
-        }
-        // axios returns an ArrayBuffer for responseType: "arraybuffer".
-        const buffer = Buffer.from(response.data);
-        // Re-check the size: maxContentLength relies on Content-Length, which may be
-        // absent or lie, so guard against the actual byte count too.
-        if (buffer.length === 0) {
-            throw new Error(`Empty image response from "${url}"`);
-        }
-        if (buffer.length > maxBytes) {
-            throw new Error(`Image too large: ${buffer.length} bytes exceeds the ${maxBytes}-byte cap`);
-        }
-        // Resolve MIME: prefer the response Content-Type (strip any "; charset=..."
-        // parameter, lowercase, trim) mapped through the supported set; if the
-        // header is generic/missing/unsupported, fall back to the URL path
-        // extension via the existing extension->MIME logic.
-        const rawCt = response.headers?.["content-type"];
-        let mime = null;
-        if (typeof rawCt === "string" && rawCt.length > 0) {
-            const ct = rawCt.split(";")[0].trim().toLowerCase();
-            mime = this.supportedImageMime(ct);
-        }
-        if (!mime) {
-            // Fall back to the URL path extension. Use the pathname so the query
-            // string never contaminates the extension lookup.
-            const ext = extname(parsed.pathname).toLowerCase();
-            mime = EXT_TO_MIME[ext] ?? null;
-        }
-        if (!mime) {
-            throw new Error(`cannot determine supported image type for "${url}"; supported: png, jpg, jpeg, gif, webp, svg`);
-        }
-        // Build a filename from the URL path basename (ignore the query string),
-        // defaulting to "image" when empty, and ensure it ends with the canonical
-        // extension for the resolved MIME (append it when missing/mismatched).
-        const canonicalExt = MIME_TO_EXT[mime];
-        let fileName = basename(parsed.pathname) || "image";
-        if (extname(fileName).toLowerCase() !== canonicalExt) {
-            fileName += canonicalExt;
-        }
-        return { buffer, mime, fileName };
-    }
-    /** Build a Docmost ProseMirror image node from an uploaded attachment. */
-    buildImageNode(att, align, alt) {
-        // Clean file URL, matching Docmost's native behaviour. No cache-busting
-        // query: the server serves the bare URL correctly, and replacement creates
-        // a new attachment id (a new URL) which busts caches naturally.
-        const src = `/api/files/${att.id}/${att.fileName}`;
-        const node = {
-            type: "image",
-            attrs: {
-                src,
-                attachmentId: att.id,
-                // Default to null when the server omits fileSize so the attr is never
-                // undefined (undefined would be dropped on serialization / break the
-                // ProseMirror image schema which expects size present).
-                size: att.fileSize ?? null,
-                align: align || "center",
-                width: null,
-            },
-        };
-        if (alt)
-            node.attrs.alt = alt;
-        return node;
-    }
-    /**
-     * Download a remote image from an http(s) URL and upload it as an attachment
-     * of a page, returning the attachment metadata plus a ready-to-insert
-     * ProseMirror image node. Local file paths are intentionally not supported:
-     * the MCP caller is a remote AI with no access to this server's filesystem.
-     */
-    async uploadImage(pageId, url) {
-        await this.ensureAuthenticated();
-        const MAX_IMAGE_BYTES = 20 * 1024 * 1024; // 20 MiB
-        // Fetch + validate the remote image (scheme allowlist, size cap, timeout).
-        // See fetchRemoteImage for the SSRF / resource trust boundary.
-        const fetched = await this.fetchRemoteImage(url, MAX_IMAGE_BYTES);
-        const fileBuffer = fetched.buffer;
-        const mime = fetched.mime;
-        const fileName = fetched.fileName;
-        // Build a FRESH FormData for every send attempt. A FormData body is a
-        // single-use stream that is CONSUMED on the first send, so it cannot be
-        // replayed by this.client's response interceptor (replaying a consumed
-        // stream fails with 'socket hang up'). Multipart re-auth is therefore done
-        // here with bare axios and an explicit one-shot 401/403 retry that rebuilds
-        // the body. Field order matters: text fields must precede the file part so
-        // the server reads them; the server always generates a fresh attachment id.
-        const buildForm = () => {
-            const form = new FormData();
-            form.append("pageId", pageId);
-            form.append("file", fileBuffer, {
-                filename: fileName,
-                contentType: mime,
-            });
-            return form;
-        };
-        // Local name distinct from the `url` parameter (the source image URL): this
-        // is the /files/upload endpoint we POST the multipart body to.
-        const uploadUrl = `${this.apiUrl}/files/upload`;
-        let response;
-        try {
-            // Call buildForm() ONCE per attempt and reuse the instance for both
-            // getHeaders() and the body so the Content-Type boundary matches the body.
-            const form = buildForm();
-            // Read the Authorization header from this.client's defaults (set by
-            // login(), only ever deleted — never set to null) instead of building
-            // `Bearer ${this.token}`: a concurrent JSON 401 can null this.token
-            // mid-flight, which would otherwise produce a literal "Bearer null".
-            // ensureAuthenticated() above guarantees login() ran, so the default
-            // header exists here. A 60s timeout keeps a hung upload from wedging the
-            // per-page lock (replaceImage holds withPageLock across this call).
-            response = await axios.post(uploadUrl, form, {
-                headers: {
-                    ...form.getHeaders(),
-                    Authorization: this.client.defaults.headers.common["Authorization"],
-                },
-                timeout: 60000,
-            });
-        }
-        catch (error) {
-            // On an expired-token auth error, re-login and retry exactly once with a
-            // freshly-rebuilt FormData (the previous one was already consumed).
-            if (axios.isAxiosError(error) &&
-                (error.response?.status === 401 || error.response?.status === 403)) {
-                await this.login();
-                const form2 = buildForm();
-                response = await axios.post(uploadUrl, form2, {
-                    headers: {
-                        ...form2.getHeaders(),
-                        Authorization: this.client.defaults.headers.common["Authorization"],
-                    },
-                    timeout: 60000,
-                });
-            }
-            else if (axios.isAxiosError(error)) {
-                // Keep the thrown message free of the raw response body (it may echo
-                // request data or server internals); surface only status/statusText.
-                // The full body is logged under DEBUG for diagnostics.
-                if (process.env.DEBUG) {
-                    console.error("Image upload failed; response body:", JSON.stringify(error.response?.data));
-                }
-                throw new Error(`Image upload failed: ${error.response?.status} ${error.response?.statusText}`);
-            }
-            else {
-                throw error;
-            }
-        }
-        // The attachment may arrive bare or wrapped in a { data } envelope.
-        const att = response.data?.data ?? response.data;
-        if (!att?.id || !att?.fileName) {
-            throw new Error("Unexpected /files/upload response: " + JSON.stringify(response.data));
-        }
-        // Some Docmost versions omit fileSize from the upload response. Fall back
-        // to the fetched byte length (the bytes we just uploaded) so callers never
-        // get an undefined size.
-        const resolvedSize = att.fileSize ?? fileBuffer.length;
-        return {
-            attachmentId: att.id,
-            fileName: att.fileName,
-            fileSize: resolvedSize,
-            src: `/api/files/${att.id}/${att.fileName}`,
-            imageNode: this.buildImageNode({ ...att, fileSize: resolvedSize }),
-        };
-    }
-    /**
-     * Upload an image from a web (http/https) URL and insert it into a page in
-     * one step.
-     * By default the image is appended at the end. With replaceText, the first
-     * top-level block whose text contains the string is replaced; with afterText,
-     * the image is inserted right after the first matching block. All other
-     * block ids are preserved (only one top-level block is added or swapped).
-     */
-    async insertImage(pageId, url, opts = {}) {
-        const up = await this.uploadImage(pageId, url);
-        // Reuse the node from uploadImage (clean /api/files/<id>/<file> src), then
-        // apply align/alt onto a shallow attrs copy.
-        const node = { ...up.imageNode, attrs: { ...up.imageNode.attrs } };
-        if (opts.align)
-            node.attrs.align = opts.align;
-        if (opts.alt)
-            node.attrs.alt = opts.alt;
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the collab doc by the canonical UUID, never the slugId (#260). The
-        // uploadImage /files/upload call above keeps the agent-supplied id.
-        const pageUuid = await this.resolvePageId(pageId);
-        // Recursively collect the plain text of a top-level block.
-        const blockText = (n) => {
-            let out = "";
-            if (n.type === "text")
-                out += n.text || "";
-            for (const child of n.content || [])
-                out += blockText(child);
-            return out;
-        };
-        // Insert into the LIVE synced document, not the debounced REST snapshot, so
-        // concurrent edits/comments/images are preserved and parallel insert_image
-        // calls (serialized by the per-page lock) each see the previous insertion.
-        let placement;
-        const mutation = await mutatePageContent(pageUuid, collabToken, this.apiUrl, (liveDoc) => {
-            const doc = liveDoc && liveDoc.type === "doc"
-                ? liveDoc
-                : { type: "doc", content: [] };
-            if (!Array.isArray(doc.content))
-                doc.content = [];
-            if (opts.replaceText) {
-                // Ambiguity guard (mirrors editPageText): count matching top-level
-                // blocks first, so a non-unique fragment cannot silently replace the
-                // wrong block (e.g. text that also appears inside a callout/table).
-                const matches = doc.content.filter((b) => blockText(b).includes(opts.replaceText));
-                if (matches.length === 0) {
-                    throw new Error(`replaceText not found: "${opts.replaceText}"`);
-                }
-                if (matches.length > 1) {
-                    throw new Error(`replaceText "${opts.replaceText}" matches ${matches.length} blocks; use a longer unique fragment`);
-                }
-                const idx = doc.content.findIndex((b) => blockText(b).includes(opts.replaceText));
-                // Data-loss guard: replaceText swaps the WHOLE top-level block, so if
-                // the fragment only appears nested inside a container (table, callout,
-                // list, blockquote) the entire structure would be destroyed. Refuse
-                // when the matched block is a container rather than a leaf
-                // paragraph/heading and point the caller at a safer tool.
-                const CONTAINER_TYPES = new Set([
-                    "table",
-                    "callout",
-                    "bulletList",
-                    "orderedList",
-                    "taskList",
-                    "blockquote",
-                ]);
-                const matchedBlock = doc.content[idx];
-                if (matchedBlock && CONTAINER_TYPES.has(matchedBlock.type)) {
-                    throw new Error(`replaceText matched a ${matchedBlock.type} container block; replacing it would destroy the whole structure. ` +
-                        `Use afterText to insert near it, or update_page_json for surgical edits.`);
-                }
-                doc.content.splice(idx, 1, node);
-                placement = "replaced";
-            }
-            else if (opts.afterText) {
-                // Ambiguity guard (mirrors editPageText): refuse a non-unique fragment.
-                const matches = doc.content.filter((b) => blockText(b).includes(opts.afterText));
-                if (matches.length === 0) {
-                    throw new Error(`afterText not found: "${opts.afterText}"`);
-                }
-                if (matches.length > 1) {
-                    throw new Error(`afterText "${opts.afterText}" matches ${matches.length} blocks; use a longer unique fragment`);
-                }
-                const idx = doc.content.findIndex((b) => blockText(b).includes(opts.afterText));
-                doc.content.splice(idx + 1, 0, node);
-                placement = "after";
-            }
-            else {
-                doc.content.push(node);
-                placement = "appended";
-            }
-            return doc;
-        });
-        return {
-            success: true,
-            pageId,
-            attachmentId: up.attachmentId,
-            src: up.src,
-            placement,
-            verify: mutation.verify,
-        };
-    }
-    /**
-     * Replace an existing image in a page with a new image fetched from a web
-     * (http/https) URL. Uploads the new file as a brand-new attachment, which
-     * yields a fresh clean URL that both renders correctly and busts browser
-     * caches (the URL changed). Finds every image node
-     * whose attrs.attachmentId === oldAttachmentId (recursively, incl. nodes nested
-     * in callouts/tables) and repoints its src/attachmentId/size, preserving
-     * comments, alignment and alt. Operates on the live collab document so comments
-     * and concurrent edits are preserved. Throws if no matching image is found.
-     *
-     * The OLD attachment is left in place as an unreferenced orphan: Docmost
-     * exposes NO HTTP API to delete a single content attachment (verified against
-     * the attachment controller/service and by probing the live API — deletion
-     * happens only by cascade when the page, space or user is removed). This is the
-     * same outcome as Docmost's own editor when an image is removed/replaced.
-     * In-place byte overwrite is deliberately NOT used because some Docmost
-     * versions corrupt the attachment (HTTP 500) when its bytes are overwritten.
-     */
-    async replaceImage(pageId, oldAttachmentId, url, opts = {}) {
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the collab doc by the canonical UUID, never the slugId (#260). The
-        // page lock must ALSO key on the UUID so this operation serializes against
-        // other writes to the same page (mutatePageContent now locks by the resolved
-        // UUID too); locking by the raw slugId here would desync the mutex key and
-        // reopen the TOCTOU/orphan-attachment window the lock closes. uploadImage
-        // keeps the agent-supplied id (it hits REST, not the collab doc).
-        const pageUuid = await this.resolvePageId(pageId);
-        // Hold ONE per-page lock for the WHOLE operation (scan -> upload -> write).
-        // Previously the scan and the write were two separate mutatePageContent
-        // calls, each acquiring + releasing the lock, with the upload happening in
-        // the UNLOCKED gap between them. A concurrent op could interleave there: it
-        // could remove the target image so the write pass matches nothing, leaving
-        // the freshly-uploaded attachment as an un-deletable orphan (Docmost has no
-        // API to delete a single content attachment). Acquiring the lock once and
-        // using the non-locking collab helper inside (the per-page mutex is NOT
-        // reentrant, so the self-locking mutatePageContent would deadlock here)
-        // closes that TOCTOU window. uploadImage hits /files/upload over plain HTTP
-        // and does not touch the page lock, so it is safe to call while held.
-        return withPageLock(pageUuid, async () => {
-            // STEP 1: read-only live check. Scan the live document for any image node
-            // matching oldAttachmentId BEFORE uploading anything, so a wrong/stale id
-            // throws without ever creating an orphan attachment.
-            let matchFound = false;
-            const scan = (nodes) => {
-                for (const node of nodes) {
-                    if (!node)
-                        continue;
-                    if (node.type === "image" &&
-                        node.attrs &&
-                        node.attrs.attachmentId === oldAttachmentId) {
-                        matchFound = true;
-                    }
-                    if (Array.isArray(node.content))
-                        scan(node.content);
-                }
-            };
-            await this.mutateLiveContentUnlocked(pageUuid, collabToken, (liveDoc) => {
-                matchFound = false; // reset per-transform (collab may retry the read).
-                const doc = liveDoc && liveDoc.type === "doc"
-                    ? liveDoc
-                    : { type: "doc", content: [] };
-                if (Array.isArray(doc.content))
-                    scan(doc.content);
-                return null; // read-only: never write on the check pass.
-            });
-            if (!matchFound) {
-                throw new Error(`replace_image: no image with attachmentId "${oldAttachmentId}" found on page ${pageId}`);
-            }
-            // STEP 2: a match exists — upload the new file as a FRESH attachment (new
-            // id, new clean URL) and repoint every matching node in a second pass.
-            // Still inside the SAME lock, so no other op can have changed the page
-            // since the scan.
-            const up = await this.uploadImage(pageId, url);
-            let replaced = 0;
-            // Swap the source of one image node, preserving align/alt/title/geometry.
-            const repoint = (node) => {
-                node.attrs = {
-                    ...node.attrs,
-                    src: up.src,
-                    attachmentId: up.attachmentId,
-                    // Default to null when fileSize is unknown so the attr is never
-                    // undefined.
-                    size: up.fileSize ?? null,
-                };
-                if (opts.align)
-                    node.attrs.align = opts.align;
-                if (opts.alt !== undefined)
-                    node.attrs.alt = opts.alt;
-                replaced++;
-            };
-            // Recursively repoint every image node (incl. ones nested in callouts/tables).
-            const walk = (nodes) => {
-                for (const node of nodes) {
-                    if (!node)
-                        continue;
-                    if (node.type === "image" &&
-                        node.attrs &&
-                        node.attrs.attachmentId === oldAttachmentId) {
-                        repoint(node);
-                    }
-                    if (Array.isArray(node.content))
-                        walk(node.content);
-                }
-            };
-            const mutation = await this.mutateLiveContentUnlocked(pageUuid, collabToken, (liveDoc) => {
-                // Reset per-transform so collab retries recompute cleanly (no double-count).
-                replaced = 0;
-                const doc = liveDoc && liveDoc.type === "doc"
-                    ? liveDoc
-                    : { type: "doc", content: [] };
-                if (!Array.isArray(doc.content))
-                    doc.content = [];
-                walk(doc.content);
-                if (replaced === 0)
-                    return null; // no match -> skip the write entirely
-                return doc;
-            });
-            // KNOWN LIMITATION: a same-count image SRC swap (image count unchanged, no
-            // text/mark change) may still report verify.changed === false, because the
-            // text+marks+integrity-count model in summarizeChange does not inspect
-            // image `src`/attachmentId attributes. That is acceptable here — the
-            // replace is confirmed by `replaced` below, and verify is supplementary.
-            if (replaced === 0) {
-                // The pass-1 SCAN found the target (matchFound was true) and we already
-                // uploaded the new attachment, but pass-2 matched nothing — a concurrent
-                // editor must have removed the node between the two passes. Do NOT throw
-                // here (that would leak the just-uploaded attachment AND report failure);
-                // instead report success with the upload flagged as an unreferenced
-                // orphan so the caller knows. (The early throw above still covers the
-                // case where pass-1 finds nothing, before any upload happens.)
-                return {
-                    success: true,
-                    replaced: 0,
-                    pageId,
-                    oldAttachmentId,
-                    newAttachmentId: up.attachmentId,
-                    src: up.src,
-                    orphanedAttachmentId: up.attachmentId,
-                    warning: "target image was removed concurrently; uploaded attachment is unreferenced",
-                    verify: mutation.verify,
-                };
-            }
-            return {
-                success: true,
-                pageId,
-                replaced,
-                oldAttachmentId,
-                newAttachmentId: up.attachmentId,
-                src: up.src,
-                verify: mutation.verify,
-            };
-        });
-    }
-    // --- Page history / diff / transform ---
-    /**
-     * List the saved versions (history snapshots) of a page, newest first.
-     * Docmost auto-snapshots on every save. Returns one cursor-paginated page of
-     * results: `{ items, nextCursor }`. The history record's id field is `id`.
-     */
-    async listPageHistory(pageId, cursor) {
-        await this.ensureAuthenticated();
-        const payload = { pageId };
-        if (cursor)
-            payload.cursor = cursor;
-        const response = await this.client.post("/pages/history", payload);
-        const data = response.data?.data ?? response.data;
-        return {
-            items: data?.items ?? [],
-            nextCursor: data?.meta?.nextCursor ?? null,
-        };
-    }
-    /**
-     * Fetch a single page-history version including its lossless ProseMirror
-     * `content`. The version also carries pageId/title/createdAt.
-     */
-    async getPageHistory(historyId) {
-        await this.ensureAuthenticated();
-        const response = await this.client.post("/pages/history/info", {
-            historyId,
-        });
-        return response.data?.data ?? response.data;
-    }
-    /**
-     * "Restore" a version: Docmost has NO restore endpoint, so we take the
-     * version's `content` and write it as the page's current content via the live
-     * collab path (which itself creates a new history snapshot). Returns the
-     * affected pageId and the source historyId.
-     */
-    async restorePageVersion(historyId) {
-        await this.ensureAuthenticated();
-        const version = await this.getPageHistory(historyId);
-        if (!version ||
-            !version.pageId ||
-            !version.content ||
-            typeof version.content !== "object") {
-            throw new Error(`restore_page_version: history ${historyId} has no usable content`);
-        }
-        // Defense-in-depth: sanitize URLs in the restored content (parity with the
-        // JSON write path) before writing it back.
-        this.validateDocUrls(version.content);
-        const collabToken = await this.getCollabTokenWithReauth();
-        // version.pageId is the page entity id (already a UUID); resolvePageId
-        // short-circuits a UUID with no round-trip, so this is defensive only (#260).
-        const pageUuid = await this.resolvePageId(version.pageId);
-        const mutation = await mutatePageContent(pageUuid, collabToken, this.apiUrl, () => version.content);
-        return {
-            pageId: version.pageId,
-            restoredFrom: historyId,
-            verify: mutation.verify,
-        };
-    }
-    /**
-     * Diff two versions of a page and return a Docmost-equivalent change set.
-     * `from`/`to` each resolve to a ProseMirror doc:
-     *   - null / undefined / "current" -> the page's CURRENT content;
-     *   - any other string             -> that historyId's content.
-     * Returns the diff plus the resolved version metadata for each side.
-     */
-    async diffPageVersions(pageId, from, to) {
-        await this.ensureAuthenticated();
-        const isCurrent = (v) => v == null || v === "" || v === "current";
-        const resolveSide = async (v) => {
-            if (isCurrent(v)) {
-                const raw = await this.getPageRaw(pageId);
-                return {
-                    doc: raw.content || { type: "doc", content: [] },
-                    meta: {
-                        kind: "current",
-                        pageId,
-                        title: raw.title,
-                        updatedAt: raw.updatedAt,
-                    },
-                };
-            }
-            const version = await this.getPageHistory(v);
-            return {
-                doc: version.content || { type: "doc", content: [] },
-                meta: {
-                    kind: "history",
-                    historyId: version.id,
-                    pageId: version.pageId,
-                    title: version.title,
-                    createdAt: version.createdAt,
-                },
-            };
-        };
-        const fromSide = await resolveSide(from);
-        const toSide = await resolveSide(to);
-        const diff = diffDocs(fromSide.doc, toSide.doc);
-        return { from: fromSide.meta, to: toSide.meta, diff };
-    }
-    /**
-     * Edit a page by running an arbitrary user-supplied JS transform against the
-     * live document, with a diff preview + page-history safety net.
-     *
-     * The transform string is evaluated as `(doc, ctx) => doc` inside a node:vm
-     * sandbox: it gets ONLY `{ doc, ctx, structuredClone, console }` as globals,
-     * a 5s timeout, and NO access to require/process/fs/network. It must return a
-     * `{ type: "doc" }` node, which is validated structurally before any write.
-     *
-     * `ctx` exposes:
-     *   - comments: the page's comments (fetched before the live read);
-     *   - log: an array the transform can push diagnostics to (via console.log);
-     *   - consume(id): mark a comment id as consumed (for deleteComments);
-     *   - helpers: the transforms.ts primitives + commentsToFootnotes.
-     *
-     * Footnote convention used by the helpers: footnote markers are plain "[N]"
-     * text in the body, and the notes are an orderedList under a heading whose
-     * text is "Примечания переводчика".
-     *
-     * dryRun (default true): read the page's current content, run the transform,
-     * and return `{ pushed:false, diff, log }` WITHOUT opening the collab socket.
-     * Otherwise the transform runs atomically inside mutatePageContent, optionally
-     * deletes consumed comments, and returns the new historyId + diff + log.
-     */
-    async transformPage(pageId, transformJs, opts = {}) {
-        const dryRun = opts.dryRun ?? true;
-        const deleteComments = opts.deleteComments ?? false;
-        await this.ensureAuthenticated();
-        const comments = await this.listComments(pageId);
-        // ctx handed to the sandbox. consume() records ids; helpers are the pure
-        // transform primitives. log is captured from console.log inside the sandbox.
-        const ctx = {
-            comments,
-            log: [],
-            consumed: new Set(),
-            consume(id) {
-                this.consumed.add(id);
-            },
-            helpers: {
-                blockText,
-                walk,
-                getList,
-                insertMarkerAfter,
-                setCalloutRange,
-                noteItem,
-                mdToInlineNodes,
-                commentsToFootnotes,
-                canonicalizeFootnotes,
-                insertInlineFootnote,
-            },
-        };
-        // Captured oldDoc / newDoc for the diff (set inside runTransform).
-        let oldDoc;
-        let newDoc;
-        // SYNCHRONOUS transform runner — safe to call inside mutatePageContent's
-        // onSynced (no await between the live read and the write).
-        const runTransform = (liveDoc) => {
-            oldDoc = structuredClone(liveDoc);
-            const sandbox = {
-                doc: structuredClone(liveDoc),
-                ctx,
-                structuredClone,
-                console: {
-                    log: (...a) => ctx.log.push(a.map((x) => String(x)).join(" ")),
-                },
-            };
-            // Wrap the provided string in parentheses so both an expression-arrow
-            // (`(doc, ctx) => {...}`) and a parenthesized function work. Run it in a
-            // fresh context with no require/process/module so the transform cannot
-            // touch fs/network/process. 5s wall-clock timeout.
-            let fn;
-            try {
-                fn = vm.runInNewContext("(" + transformJs + ")", sandbox, {
-                    timeout: 5000,
-                });
-            }
-            catch (e) {
-                throw new Error(`transform did not compile: ${e?.message ?? e}`);
-            }
-            if (typeof fn !== "function") {
-                throw new Error("transform must evaluate to a function (doc, ctx) => doc");
-            }
-            const raw = vm.runInNewContext("f(d, c)", { f: fn, d: sandbox.doc, c: ctx }, { timeout: 5000 });
-            if (!raw ||
-                typeof raw !== "object" ||
-                raw.type !== "doc" ||
-                !Array.isArray(raw.content)) {
-                throw new Error('transform must return a ProseMirror doc node ({ type:"doc", content:[...] })');
-            }
-            // Validate the RAW transform output FIRST (structure — including the
-            // MAX_DEPTH guard — and URLs), mirroring updatePageJson. The canonicalizer
-            // recurses without a depth limiter, so validating after it would turn a
-            // too-deep doc into an opaque "Maximum call stack size exceeded" instead of
-            // the intended "nesting exceeds the maximum depth" error.
-            this.validateDocStructure(raw);
-            this.validateDocUrls(raw);
-            // Auto-canonicalize footnotes after the transform (idempotent): no write
-            // path can leave footnotes out of order / orphaned / in a raw `[^id]`
-            // block. In a dryRun preview this may surface footnote edits the script
-            // author did not write (the canonicalizer tidied them) — that is expected.
-            const result = canonicalizeFootnotes(raw);
-            newDoc = result;
-            return result;
-        };
-        if (dryRun) {
-            // Preview only: run against the current REST snapshot, never open the
-            // socket. oldDoc/newDoc are captured by runTransform.
-            const raw = await this.getPageRaw(pageId);
-            const current = raw.content || { type: "doc", content: [] };
-            runTransform(current);
-            // Run an independent Yjs-encodability check (same sanitize + schema as the
-            // apply path), so the preview fails with the same descriptive error when
-            // the doc is not encodable instead of returning a misleadingly-green diff.
-            assertYjsEncodable(newDoc);
-            return {
-                pushed: false,
-                diff: diffDocs(oldDoc, newDoc),
-                log: ctx.log,
-            };
-        }
-        // Apply atomically against the live doc.
-        const collabToken = await this.getCollabTokenWithReauth();
-        // Open the collab doc by the canonical UUID, never the slugId (#260).
-        const pageUuid = await this.resolvePageId(pageId);
-        const mutation = await mutatePageContent(pageUuid, collabToken, this.apiUrl, runTransform);
-        // Optionally delete consumed comments (best-effort; a delete failure must
-        // not undo the successful write).
-        const deletedComments = [];
-        if (deleteComments) {
-            for (const id of ctx.consumed) {
-                try {
-                    await this.deleteComment(id);
-                    deletedComments.push(id);
-                }
-                catch (e) {
-                    if (process.env.DEBUG) {
-                        console.error(`transform: failed to delete comment ${id}:`, e);
-                    }
-                }
-            }
-        }
-        // Fetch the newest historyId (Docmost snapshots on the write above).
-        let historyId = null;
-        try {
-            const hist = await this.listPageHistory(pageId);
-            historyId = hist.items?.[0]?.id ?? null;
-        }
-        catch (e) {
-            if (process.env.DEBUG) {
-                console.error("transform: failed to fetch history id:", e);
-            }
-        }
-        return {
-            pushed: true,
-            historyId,
-            diff: diffDocs(oldDoc, newDoc),
-            deletedComments,
-            log: ctx.log,
-            verify: mutation.verify,
-        };
-    }
-}
diff --git a/packages/mcp/build/http.js b/packages/mcp/build/http.js
deleted file mode 100644
index 45c422b0..00000000
--- a/packages/mcp/build/http.js
+++ /dev/null
@@ -1,133 +0,0 @@
-import { randomUUID } from "node:crypto";
-import { StreamableHTTPServerTransport } from "@modelcontextprotocol/sdk/server/streamableHttp.js";
-import { isInitializeRequest } from "@modelcontextprotocol/sdk/types.js";
-import { createDocmostMcpServer } from "./index.js";
-/**
- * Build a stateful Streamable-HTTP handler for the Docmost MCP server. The
- * embedding host (the gitmost NestJS server) bridges its raw Node req/res into
- * `handleRequest`. One McpServer + transport is created per MCP session and
- * kept alive between requests, keyed by the `mcp-session-id` header.
- *
- * `config` is EITHER a static `DocmostMcpConfig` (back-compat: stdio + the env
- * service account, unchanged) OR a `McpConfigResolver` run once per session at
- * `initialize` to bind that session to the request's identity.
- */
-export function createMcpHttpHandler(config, options = {}) {
-    // One transport (and one McpServer) per MCP session, keyed by session id.
-    const transports = {};
-    // Last activity timestamp per session id, used for idle eviction.
-    const lastSeen = {};
-    // Anti-session-fixation: the opaque identity key bound to each session at
-    // initialize. A later request for that session whose key differs is rejected.
-    const sessionIdentity = {};
-    // Write a JSON-RPC error and end the response. Used for the 400/401 paths so
-    // every early rejection is a well-formed JSON-RPC error, not a torn response.
-    const sendJsonRpcError = (res, statusCode, code, message) => {
-        res.statusCode = statusCode;
-        res.setHeader("Content-Type", "application/json");
-        res.end(JSON.stringify({
-            jsonrpc: "2.0",
-            error: { code, message },
-            id: null,
-        }));
-    };
-    // Idle session TTL (ms): a session with no activity for this long is evicted.
-    // Defaults to 30 min; overridable via MCP_SESSION_IDLE_MS.
-    const idleTtlMs = (() => {
-        const parsed = parseInt(process.env.MCP_SESSION_IDLE_MS ?? "", 10);
-        return Number.isFinite(parsed) && parsed > 0 ? parsed : 30 * 60 * 1000;
-    })();
-    // Periodically close transports idle longer than the TTL. transport.close()
-    // triggers its onclose, which removes it from `transports`; we also drop the
-    // lastSeen entry. unref() so this timer never keeps the process alive.
-    const sweepIntervalMs = 5 * 60 * 1000;
-    const sweepTimer = setInterval(() => {
-        const now = Date.now();
-        for (const sid of Object.keys(transports)) {
-            if (now - (lastSeen[sid] ?? 0) > idleTtlMs) {
-                void transports[sid].close();
-                delete lastSeen[sid];
-                delete sessionIdentity[sid];
-            }
-        }
-    }, sweepIntervalMs);
-    sweepTimer.unref();
-    async function handleRequest(req, res, parsedBody) {
-        const sessionId = req.headers["mcp-session-id"];
-        const method = (req.method || "GET").toUpperCase();
-        let transport = sessionId ? transports[sessionId] : undefined;
-        if (method === "POST" && !transport) {
-            // A new session may only be created by an initialize request without a
-            // session id.
-            if (sessionId || !isInitializeRequest(parsedBody)) {
-                sendJsonRpcError(res, 400, -32000, "Bad Request: no valid session ID provided");
-                return;
-            }
-            // Resolve the per-session config from the request (per-user identity) when
-            // a resolver was supplied; otherwise use the static config unchanged. The
-            // resolver may throw (e.g. bad credentials) — surface a clean 401, never
-            // a created session.
-            let sessionConfig;
-            let identity;
-            try {
-                sessionConfig =
-                    typeof config === "function" ? await config(req) : config;
-                if (options.identify)
-                    identity = await options.identify(req);
-            }
-            catch (err) {
-                sendJsonRpcError(res, 401, -32001, err instanceof Error ? err.message : "Unauthorized");
-                return;
-            }
-            transport = new StreamableHTTPServerTransport({
-                sessionIdGenerator: () => randomUUID(),
-                onsessioninitialized: (sid) => {
-                    transports[sid] = transport;
-                    lastSeen[sid] = Date.now();
-                    // Bind the resolved identity to the new session id for anti-fixation.
-                    if (identity !== undefined)
-                        sessionIdentity[sid] = identity;
-                },
-            });
-            transport.onclose = () => {
-                const sid = transport.sessionId;
-                if (sid && transports[sid])
-                    delete transports[sid];
-                if (sid)
-                    delete sessionIdentity[sid];
-            };
-            const server = createDocmostMcpServer(sessionConfig);
-            await server.connect(transport);
-            await transport.handleRequest(req, res, parsedBody);
-            return;
-        }
-        if (!transport) {
-            sendJsonRpcError(res, 400, -32000, "Bad Request: no valid session ID provided");
-            return;
-        }
-        // Anti-session-fixation: a request reusing an existing session id must
-        // present credentials/token that resolve to the SAME identity bound at
-        // initialize, otherwise reject with 401. This prevents hijacking another
-        // user's established session by replaying its session id with different
-        // credentials.
-        if (options.identify && sessionId && sessionId in sessionIdentity) {
-            let presented;
-            try {
-                presented = await options.identify(req);
-            }
-            catch (err) {
-                sendJsonRpcError(res, 401, -32001, err instanceof Error ? err.message : "Unauthorized");
-                return;
-            }
-            if (presented !== sessionIdentity[sessionId]) {
-                sendJsonRpcError(res, 401, -32001, "Credentials do not match the user that owns this MCP session.");
-                return;
-            }
-        }
-        // Routing to an existing transport: refresh its idle timestamp.
-        if (sessionId)
-            lastSeen[sessionId] = Date.now();
-        await transport.handleRequest(req, res, parsedBody);
-    }
-    return { handleRequest };
-}
diff --git a/packages/mcp/build/index.js b/packages/mcp/build/index.js
deleted file mode 100644
index a9fc3696..00000000
--- a/packages/mcp/build/index.js
+++ /dev/null
@@ -1,810 +0,0 @@
-import { McpServer } from "@modelcontextprotocol/sdk/server/mcp.js";
-import { z } from "zod";
-import { readFileSync } from "fs";
-import { fileURLToPath } from "url";
-import { dirname, join } from "path";
-import { DocmostClient } from "./client.js";
-import { parseNodeArg } from "./lib/parse-node-arg.js";
-import { SHARED_TOOL_SPECS } from "./tool-specs.js";
-// Re-export the client and its config type so embedding hosts (e.g. the gitmost
-// NestJS server) can `import('@docmost/mcp')` and construct a DocmostClient
-// directly — for the credentials variant OR the per-user getToken variant.
-export { DocmostClient } from "./client.js";
-// Re-export the zod-agnostic shared tool-spec registry so the in-app AI-SDK
-// service can read it off the loaded module (it cannot import the ESM package's
-// internals directly; it goes through loadDocmostMcp()).
-export { SHARED_TOOL_SPECS } from "./tool-specs.js";
-// Read version from package.json
-const __filename = fileURLToPath(import.meta.url);
-const __dirname = dirname(__filename);
-const packageJson = JSON.parse(readFileSync(join(__dirname, "../package.json"), "utf-8"));
-const VERSION = packageJson.version;
-// Configuration for an MCP server instance is the DocmostMcpConfig union
-// (credentials OR getToken) defined and re-exported above. The factory below is
-// fully side-effect-free on import: it reads no environment variables and opens
-// no transport. The standalone stdio entrypoint (stdio.ts) and the HTTP handler
-// (http.ts) supply this config and own the process/transport lifecycle.
-// --- Modern McpServer Implementation ---
-// Editing guide surfaced to MCP clients in the initialize result so they can
-// pick the right tool by intent and avoid resending whole documents.
-//
-// MAINTENANCE RULE: when you ADD, RENAME, or REMOVE a tool (either an inline
-// server.registerTool(...) here or a spec in tool-specs.ts), you MUST update
-// this guide so the new tool is routed by intent. This is enforced by
-// test/unit/server-instructions.test.mjs, which fails when a registered tool
-// name is not mentioned below (see its EXCEPTIONS list for the rare opt-outs).
-// Exported for that test.
-export const SERVER_INSTRUCTIONS = "Docmost editing guide — choose the tool by intent.\n" +
-    "READ: find a page -> search (workspace-wide full-text); list -> list_pages / list_spaces. Locate blocks and their ids CHEAPLY -> get_outline (compact top-level map; start here, not get_page_json). One block's subtree -> get_node (by attrs.id, or \"#<index>\" for tables, which carry no id). Find every occurrence of a string/regex ON a page (and where each is) -> search_in_page, NOT block-by-block get_node — it returns each hit's node ref + block index + context for a targeted comment. Whole page -> get_page (Markdown, lossy; inline <span data-comment-id> tags are comment anchors — markup, not text) or get_page_json (lossless ProseMirror with block ids). Hand a huge page (with images) to an external consumer without pulling it through the model context -> stash_page (returns a short-lived anonymous URL).\n" +
-    "EDIT: fix wording/typos/numbers -> edit_page_text (find/replace inside blocks, no node id needed). Change ONE block (paragraph/heading/callout/etc.) structurally -> patch_node (by attrs.id from get_outline). Add a block -> insert_node (before/after a block by attrs.id or by anchor text, or append). Remove a block -> delete_node (by attrs.id). Tables -> table_get / table_update_cell / table_insert_row / table_delete_row (address by \"#<index>\" from get_outline; table nodes have no attrs.id). Images -> insert_image (add from a web URL) / replace_image (swap an existing image). Footnotes -> insert_footnote. Bulk/structural rewrite -> update_page_json (full ProseMirror replace; prefer the granular tools above to avoid resending the whole ~100KB+ document). Complex/scripted rewrite (multiple coordinated edits, renumbering) -> docmost_transform: write a JS `(doc, ctx) => doc` transform, preview the diff with dryRun (default), then apply with dryRun:false; ctx.helpers includes commentsToFootnotes for turning inline comments into numbered footnotes.\n" +
-    "PAGES: new -> create_page (Markdown). Rename (title only) -> rename_page. Move -> move_page. Delete -> delete_page (SOFT delete — the page goes to trash and is restorable; nothing is permanent). Copy/replace a page's whole content from another page (server-side, no document through the model) -> copy_page_content. Sharing -> share_page / unshare_page / list_shares; share_page makes the page PUBLICLY accessible — do it only when explicitly asked.\n" +
-    "COMMENTS: create_comment is always inline and requires an EXACT selection — contiguous text from a single block, <=250 chars (fails rather than leaving an unanchored comment); reply to a thread via parentCommentId. Propose a concrete text fix for one-click human approval -> create_comment with suggestedText (the exact plain-text replacement for the selection; the selection must then be UNIQUE in the page — extend it with context if needed); prefer this over editing directly when the change is subjective or needs the author's sign-off. Manage -> list_comments, update_comment, resolve_comment (resolve/reopen, reversible — prefer over delete to close), delete_comment, check_new_comments.\n" +
-    "HISTORY: review what changed -> diff_page_versions (a historyId vs current, or two versions). List saved versions -> list_page_history. Undo a bad edit -> restore_page_version (writes a past version back as current; itself revertible). Lossless markdown round-trip (download, edit, re-upload, incl. comment anchors) -> export_page_markdown / import_page_markdown.";
-// Helper to format JSON responses
-const jsonContent = (data) => ({
-    content: [{ type: "text", text: JSON.stringify(data, null, 2) }],
-});
-/**
- * Create a fully configured Docmost MCP server. Side-effect-free: it does not
- * read environment variables and does not connect any transport — the caller
- * decides how to expose it (stdio or HTTP). The client talks to Docmost over
- * REST + the collaboration WebSocket using the provided service-account
- * credentials and auto-re-authenticates.
- */
-export function createDocmostMcpServer(config) {
-    // Pass the whole config union through: the client branches internally on
-    // credentials vs. getToken, so both the external /mcp (creds) and the
-    // internal per-user (getToken) paths are wired here unchanged.
-    const docmostClient = new DocmostClient(config);
-    const server = new McpServer({
-        name: "docmost-mcp",
-        version: VERSION,
-    }, { instructions: SERVER_INSTRUCTIONS });
-    // Register a tool from the shared, zod-agnostic spec registry. The spec owns
-    // the canonical name + model-facing description + (optional) schema builder;
-    // only the execute body is supplied per call. buildShape is invoked with THIS
-    // package's zod (v3); the in-app layer passes its own zod (v4).
-    //
-    // The spec's schema builder returns a plain ZodRawShape (Record<string,
-    // unknown> in the shared module since it must stay zod-agnostic), so the
-    // McpServer.registerTool overloads cannot infer the execute arg's shape from
-    // it. We type `execute` loosely and cast the call through `any`; runtime
-    // behaviour is unchanged — each execute body destructures the same fields the
-    // builder declares.
-    const registerShared = (spec, execute) => server.registerTool(spec.mcpName, spec.buildShape
-        ? { description: spec.description, inputSchema: spec.buildShape(z) }
-        : { description: spec.description }, execute);
-    // Tool: get_workspace
-    registerShared(SHARED_TOOL_SPECS.getWorkspace, async () => {
-        const workspace = await docmostClient.getWorkspace();
-        return jsonContent(workspace);
-    });
-    // Tool: list_spaces
-    registerShared(SHARED_TOOL_SPECS.listSpaces, async () => {
-        const spaces = await docmostClient.getSpaces();
-        return jsonContent(spaces);
-    });
-    // Tool: list_pages
-    // INTENTIONAL per-transport divergence (not in the shared registry): this
-    // transport exposes a `tree:true` mode that returns the full nested hierarchy;
-    // the in-app copy keeps the same tree option but is worded for the in-app agent.
-    // Kept per-layer so each side can tune its own guidance.
-    server.registerTool("list_pages", {
-        description: "List most recent pages in a space ordered by updatedAt (descending). " +
-            "Returns a bounded list (default 50, max 100) — use search for lookups " +
-            "in large spaces. Pass tree:true (with spaceId) to instead get the " +
-            "space's full page hierarchy as a nested tree.",
-        inputSchema: {
-            spaceId: z.string().optional(),
-            limit: z
-                .number()
-                .int()
-                .min(1)
-                .max(100)
-                .optional()
-                .describe("Max pages to return (default 50, max 100)"),
-            tree: z
-                .boolean()
-                .optional()
-                .describe("When true, return the space's full page hierarchy as a nested tree (each node has a children array) instead of the recent-by-updatedAt flat list. Requires spaceId; ignores limit."),
-        },
-    }, async ({ spaceId, limit, tree }) => {
-        const result = await docmostClient.listPages(spaceId, limit ?? 50, tree ?? false);
-        return jsonContent(result);
-    });
-    // Tool: get_page
-    server.registerTool("get_page", {
-        description: "Get page details with content converted to Markdown. The conversion is " +
-            "LOSSY (block ids, exact table/callout structure are approximated); for a " +
-            "lossless representation use get_page_json. Inline <span data-comment-id> " +
-            "tags in the markdown are comment highlight anchors (also present for " +
-            "RESOLVED threads) — treat them as markup, not page text.",
-        inputSchema: {
-            pageId: z.string().min(1),
-        },
-    }, async ({ pageId }) => {
-        const page = await docmostClient.getPage(pageId);
-        return jsonContent(page);
-    });
-    // Tool: get_page_json
-    registerShared(SHARED_TOOL_SPECS.getPageJson, async ({ pageId }) => {
-        const page = await docmostClient.getPageJson(pageId);
-        return jsonContent(page);
-    });
-    // Tool: get_outline
-    registerShared(SHARED_TOOL_SPECS.getOutline, async ({ pageId }) => {
-        const result = await docmostClient.getOutline(pageId);
-        return jsonContent(result);
-    });
-    // Tool: get_node
-    registerShared(SHARED_TOOL_SPECS.getNode, async ({ pageId, nodeId }) => {
-        const result = await docmostClient.getNode(pageId, nodeId);
-        return jsonContent(result);
-    });
-    // Tool: search_in_page
-    registerShared(SHARED_TOOL_SPECS.searchInPage, async ({ pageId, query, regex, caseSensitive, limit }) => {
-        const result = await docmostClient.searchInPage(pageId, query, {
-            regex,
-            caseSensitive,
-            limit,
-        });
-        return jsonContent(result);
-    });
-    // Tool: table_get
-    server.registerTool("table_get", {
-        description: "Read a table as a matrix. Returns {rows, cols, cells (text[][]), " +
-            "cellIds (paragraph id per cell, or null)}. `table` = `#<index>` from " +
-            "get_outline, or any block id inside the table. Use cellIds with " +
-            "patch_node for rich-formatted cell edits. `cols` is the FIRST row's " +
-            "width; ragged tables may vary per row, so use the per-row length of " +
-            "`cells` for each row.",
-        inputSchema: {
-            pageId: z.string().min(1),
-            table: z.string().min(1),
-        },
-    }, async ({ pageId, table }) => {
-        const result = await docmostClient.getTable(pageId, table);
-        return jsonContent(result);
-    });
-    // Tool: table_insert_row
-    // NOT in the shared registry: this transport names the table argument `table`,
-    // while the in-app tool names it `tableRef` (ai-chat-tools.service.ts). Sharing
-    // one buildShape would rename a public MCP parameter, so the table row/cell
-    // tools stay per-transport by design.
-    server.registerTool("table_insert_row", {
-        description: "Insert a row of plain-text cells into a table. `table` = `#<index>` or " +
-            "a block id inside it. `cells` = text per column (padded to the table's " +
-            "column count; error if more cells than columns). `index` = 0-based " +
-            "insert position (0 inserts before the header); omit to append at the end.",
-        inputSchema: {
-            pageId: z.string().min(1),
-            table: z.string().min(1),
-            cells: z.array(z.string()),
-            index: z.number().int().optional(),
-        },
-    }, async ({ pageId, table, cells, index }) => {
-        const result = await docmostClient.tableInsertRow(pageId, table, cells, index);
-        return jsonContent(result);
-    });
-    // Tool: table_delete_row
-    // NOT shared — same `table` (here) vs `tableRef` (in-app) parameter-name
-    // divergence as table_insert_row.
-    server.registerTool("table_delete_row", {
-        description: "Delete the row at 0-based `index` from a table (`table` = `#<index>` or " +
-            "a block id inside it). Refuses to delete the table's only row. An " +
-            "out-of-range `index` throws. Deleting `index` 0 removes the header row, " +
-            "and the next row becomes the new header.",
-        inputSchema: {
-            pageId: z.string().min(1),
-            table: z.string().min(1),
-            index: z.number().int(),
-        },
-    }, async ({ pageId, table, index }) => {
-        const result = await docmostClient.tableDeleteRow(pageId, table, index);
-        return jsonContent(result);
-    });
-    // Tool: table_update_cell
-    // NOT shared — same `table` (here) vs `tableRef` (in-app) parameter-name
-    // divergence as table_insert_row.
-    server.registerTool("table_update_cell", {
-        description: "Set the plain-text content of cell [row,col] (0-based) in a table " +
-            "(`table` = `#<index>` or a block id inside it). Replaces the cell's " +
-            "content with a single text paragraph; for rich formatting use patch_node " +
-            "on the cell's paragraph id from table_get.",
-        inputSchema: {
-            pageId: z.string().min(1),
-            table: z.string().min(1),
-            row: z.number().int(),
-            col: z.number().int(),
-            text: z.string(),
-        },
-    }, async ({ pageId, table, row, col, text }) => {
-        const result = await docmostClient.tableUpdateCell(pageId, table, row, col, text);
-        return jsonContent(result);
-    });
-    // Tool: create_page
-    server.registerTool("create_page", {
-        description: "Create a new page from Markdown in a space. Pass parentPageId to nest " +
-            "it under a parent; omit it to create at the space root.",
-        inputSchema: {
-            title: z.string().min(1).describe("Title of the page"),
-            content: z.string().min(1).describe("Markdown content"),
-            spaceId: z.string().min(1),
-            parentPageId: z
-                .string()
-                .optional()
-                .describe("Optional parent page ID to nest under"),
-        },
-    }, async ({ title, content, spaceId, parentPageId }) => {
-        const result = await docmostClient.createPage(title, content, spaceId, parentPageId);
-        return jsonContent(result);
-    });
-    // Tool: update_page_json
-    server.registerTool("update_page_json", {
-        description: "Replace a page's content with a raw ProseMirror JSON document " +
-            "(lossless write: preserves the block ids, callouts, tables and " +
-            "attributes you pass in). Typical flow: get_page_json -> modify the " +
-            "JSON -> update_page_json. Keep existing node ids intact so heading " +
-            "anchors and history stay stable. Minimal full-doc example: " +
-            '{"type":"doc","content":[{"type":"paragraph","content":' +
-            '[{"type":"text","text":"Hi"}]}]}. `content` may be a JSON object or a ' +
-            "JSON string (both accepted), and is OPTIONAL: omit it to update only " +
-            "the title (though prefer rename_page for a title-only change). " +
-            "Supplying neither content nor title is an error.",
-        inputSchema: {
-            pageId: z.string().min(1).describe("ID of the page to update"),
-            content: z
-                .any()
-                .optional()
-                .describe('ProseMirror document {"type":"doc","content":[...]} (JSON object or ' +
-                "JSON string). Omit to rename only."),
-            title: z.string().optional().describe("Optional new title"),
-        },
-    }, async ({ pageId, content, title }) => {
-        // Only parse/validate the document when it was actually supplied; when it
-        // is omitted, pass it straight through so the client performs a title-only
-        // (or no-op) update.
-        let doc;
-        if (content === undefined || content === null) {
-            doc = undefined;
-        }
-        else {
-            // String -> JSON.parse (throwing on invalid); object passes through.
-            doc = parseNodeArg(content, "content was a string but not valid JSON");
-        }
-        const result = await docmostClient.updatePageJson(pageId, doc, title);
-        return jsonContent(result);
-    });
-    // Tool: export_page_markdown
-    server.registerTool("export_page_markdown", {
-        description: "Export a page to a single self-contained, lossless Docmost-flavoured " +
-            "Markdown file (custom extensions): YAML-free meta header, body with " +
-            "inline comment anchors and diagrams, and a trailing comments-thread " +
-            "block. Designed for a download -> edit body -> import_page_markdown " +
-            "round-trip that preserves everything, including comment highlights. " +
-            "Comment THREADS are preserved in the file but are not re-pushed to the " +
-            "server on import.",
-        inputSchema: {
-            pageId: z.string().min(1),
-        },
-    }, async ({ pageId }) => {
-        const md = await docmostClient.exportPageMarkdown(pageId);
-        return { content: [{ type: "text", text: md }] };
-    });
-    // Tool: import_page_markdown
-    registerShared(SHARED_TOOL_SPECS.importPageMarkdown, async ({ pageId, markdown }) => {
-        const res = await docmostClient.importPageMarkdown(pageId, markdown);
-        return jsonContent(res);
-    });
-    // Tool: copy_page_content
-    registerShared(SHARED_TOOL_SPECS.copyPageContent, async ({ sourcePageId, targetPageId }) => {
-        const result = await docmostClient.copyPageContent(sourcePageId, targetPageId);
-        return jsonContent(result);
-    });
-    // Tool: rename_page
-    server.registerTool("rename_page", {
-        description: "Rename a page (change its title only) without touching or resending " +
-            "its content.",
-        inputSchema: {
-            pageId: z.string().min(1).describe("ID of the page to rename"),
-            title: z.string().min(1).describe("New title"),
-        },
-    }, async ({ pageId, title }) => {
-        const result = await docmostClient.renamePage(pageId, title);
-        return jsonContent(result);
-    });
-    // Tool: edit_page_text
-    registerShared(SHARED_TOOL_SPECS.editPageText, async ({ pageId, edits }) => {
-        const result = await docmostClient.editPageText(pageId, edits);
-        return jsonContent(result);
-    });
-    // Tool: stash_page — returns a resource_link (NOT embedded text) so the doc
-    // body never enters the model context. Registered directly (not via
-    // registerShared) because that helper only emits text content. Also returns
-    // `structuredContent` carrying the full documented `{uri, sha256, size, images}`
-    // shape alongside the resource_link, so MCP clients receive the blob's sha256
-    // (its ETag, for integrity) and mirror counts, not just the link.
-    server.registerTool(SHARED_TOOL_SPECS.stashPage.mcpName, {
-        description: SHARED_TOOL_SPECS.stashPage.description,
-        inputSchema: SHARED_TOOL_SPECS.stashPage.buildShape(z),
-    }, async ({ pageId }) => {
-        const result = await docmostClient.stashPage(pageId);
-        return {
-            content: [
-                {
-                    type: "resource_link",
-                    uri: result.uri,
-                    name: "page.json",
-                    mimeType: "application/json",
-                    size: result.size,
-                },
-            ],
-            // Mirror the full documented result shape ({ uri, size, sha256, images })
-            // as structuredContent so MCP clients get the blob's sha256 (its ETag, for
-            // integrity) and the mirror counts, not just the resource_link.
-            structuredContent: {
-                uri: result.uri,
-                sha256: result.sha256,
-                size: result.size,
-                images: result.images,
-            },
-        };
-    });
-    // Tool: patch_node — schema + description from the shared registry (identical
-    // across both transports). The execute body keeps its own parseNodeArg
-    // normalization (the model sometimes serializes `node` as a JSON string).
-    registerShared(SHARED_TOOL_SPECS.patchNode, async ({ pageId, nodeId, node }) => {
-        const parsedNode = parseNodeArg(node);
-        const result = await docmostClient.patchNode(pageId, nodeId, parsedNode);
-        return jsonContent(result);
-    });
-    // Tool: insert_node — schema + description from the shared registry. As with
-    // patch_node, the execute body retains parseNodeArg on the incoming node.
-    registerShared(SHARED_TOOL_SPECS.insertNode, async ({ pageId, node, position, anchorNodeId, anchorText }) => {
-        const parsedNode = parseNodeArg(node);
-        const result = await docmostClient.insertNode(pageId, parsedNode, {
-            position,
-            anchorNodeId,
-            anchorText,
-        });
-        return jsonContent(result);
-    });
-    // Tool: delete_node
-    registerShared(SHARED_TOOL_SPECS.deleteNode, async ({ pageId, nodeId }) => {
-        const result = await docmostClient.deleteNode(pageId, nodeId);
-        return jsonContent(result);
-    });
-    // Tool: insert_image
-    server.registerTool("insert_image", {
-        description: "Download an image from a web (http/https) URL and insert it into " +
-            "a page in one step. By default " +
-            "appends the image at the end of the page. With replaceText, replaces the " +
-            "first top-level block whose text contains that string (handy for " +
-            'swapping a text placeholder like "[image: foo.png]" for the real image). ' +
-            "With afterText, inserts the image right after the first block containing " +
-            "that string. Preserves all other block ids.",
-        inputSchema: {
-            pageId: z.string().min(1),
-            imageUrl: z
-                .string()
-                .min(1)
-                .describe("http(s) URL of the image to download and upload"),
-            align: z.enum(["left", "center", "right"]).optional(),
-            alt: z.string().optional(),
-            replaceText: z
-                .string()
-                .optional()
-                .describe("Replace the first top-level block whose text contains this string with the image"),
-            afterText: z
-                .string()
-                .optional()
-                .describe("Insert the image right after the first top-level block whose text contains this string"),
-        },
-    }, async ({ pageId, imageUrl, align, alt, replaceText, afterText }) => {
-        const result = await docmostClient.insertImage(pageId, imageUrl, {
-            align,
-            alt,
-            replaceText,
-            afterText,
-        });
-        return jsonContent(result);
-    });
-    // Tool: replace_image
-    server.registerTool("replace_image", {
-        description: "Replace an existing image on a page with a new image fetched from a web " +
-            "(http/https) URL: uploads the new file as a NEW " +
-            "attachment (fresh clean URL that renders and busts browser caches), then " +
-            "repoints every image node referencing the old attachmentId (recursively, " +
-            "incl. callouts/tables) via the live document, preserving comments, " +
-            "alignment and alt. The old attachment is left as an unreferenced orphan " +
-            "(Docmost has no API to delete a single attachment; it is removed only when " +
-            "the page/space is deleted). In-place byte overwrite is avoided because some " +
-            "Docmost versions corrupt the attachment (HTTP 500) on overwrite.",
-        inputSchema: {
-            pageId: z.string().min(1),
-            attachmentId: z
-                .string()
-                .min(1)
-                .describe("attachmentId of the image currently in the page to replace"),
-            imageUrl: z
-                .string()
-                .min(1)
-                .describe("http(s) URL of the new image to download"),
-            align: z.enum(["left", "center", "right"]).optional(),
-            alt: z.string().optional(),
-        },
-    }, async ({ pageId, attachmentId, imageUrl, align, alt }) => {
-        const result = await docmostClient.replaceImage(pageId, attachmentId, imageUrl, {
-            align,
-            alt,
-        });
-        return jsonContent(result);
-    });
-    // Tool: share_page
-    // INTENTIONAL per-transport divergence (not shared): the in-app copy adds a
-    // security-confirmation framing ("only share when the user explicitly asked,
-    // since this exposes the page to anyone with the link") tuned for the in-app
-    // agent; this transport keeps the plain public-URL wording.
-    server.registerTool("share_page", {
-        description: "Make a page publicly accessible (idempotent) and return its public " +
-            "URL. The URL format is <app>/share/<key>/p/<slugId>. This exposes the " +
-            "page content to ANYONE with the URL — do it only when explicitly asked.",
-        inputSchema: {
-            pageId: z.string().min(1).describe("ID of the page to share"),
-            searchIndexing: z
-                .boolean()
-                .optional()
-                .describe("Allow search engines to index the page (default true)"),
-        },
-    }, async ({ pageId, searchIndexing }) => {
-        const result = await docmostClient.sharePage(pageId, searchIndexing ?? true);
-        return jsonContent(result);
-    });
-    // Tool: unshare_page
-    registerShared(SHARED_TOOL_SPECS.unsharePage, async ({ pageId }) => {
-        const result = await docmostClient.unsharePage(pageId);
-        return jsonContent(result);
-    });
-    // Tool: list_shares
-    registerShared(SHARED_TOOL_SPECS.listShares, async () => {
-        const result = await docmostClient.listShares();
-        return jsonContent(result);
-    });
-    // Tool: move_page
-    server.registerTool("move_page", {
-        description: "Move a page under a new parent (nesting) or to the space root.",
-        inputSchema: {
-            pageId: z.string().min(1),
-            parentPageId: z
-                .string()
-                .nullable()
-                .optional()
-                .describe("Target parent page ID. Pass 'null' or empty string to move to root."),
-            position: z
-                .string()
-                .min(5)
-                .optional()
-                .describe("fractional-index position key; min 5 chars; omit to append at the end."),
-        },
-    }, async ({ pageId, parentPageId, position }) => {
-        const finalParentId = parentPageId === "" || parentPageId === "null" ? null : parentPageId;
-        // Cheap cycle guard: a page cannot be moved directly under itself.
-        // (Deeper descendant-cycle detection is intentionally out of scope.)
-        if (finalParentId !== null && finalParentId === pageId) {
-            throw new Error("cannot move a page under itself");
-        }
-        const result = await docmostClient.movePage(pageId, finalParentId || null, position);
-        // Require POSITIVE confirmation: the live /pages/move success shape is
-        // exactly { success: true, status: 200 }. An empty body, a 204, or any odd
-        // shape lacking success === true must NOT be reported as a successful move,
-        // so we surface the raw API result instead of declaring success.
-        if (!(result && typeof result === "object" && result.success === true)) {
-            throw new Error(`Failed to move page ${pageId}: ${JSON.stringify(result)}`);
-        }
-        return jsonContent({
-            message: `Successfully moved page ${pageId} to parent ${finalParentId || "root"}`,
-            result,
-        });
-    });
-    // Tool: delete_page
-    server.registerTool("delete_page", {
-        description: "Delete a single page by ID. SOFT delete only: the page is moved to " +
-            "trash and can be restored; nothing is permanently deleted.",
-        inputSchema: {
-            pageId: z.string().min(1),
-        },
-    }, async ({ pageId }) => {
-        await docmostClient.deletePage(pageId);
-        return {
-            content: [
-                { type: "text", text: `Successfully deleted page ${pageId}` },
-            ],
-        };
-    });
-    // --- Comment tools (ported from upstream PR #3 by Max Nikitin) ---
-    // Tool: list_comments
-    server.registerTool("list_comments", {
-        description: "List ALL comments on a page in one call (pagination is handled " +
-            "internally), including RESOLVED threads — filter by resolvedAt when you " +
-            "need only open ones. Content is returned as Markdown.",
-        inputSchema: {
-            pageId: z.string().describe("ID of the page"),
-        },
-    }, async ({ pageId }) => {
-        const comments = await docmostClient.listComments(pageId);
-        return jsonContent(comments);
-    });
-    // Tool: create_comment
-    // INTENTIONAL per-transport divergence (not shared): the in-app copy tunes the
-    // guidance for the in-app agent (e.g. "retry with a corrected EXACT selection"
-    // and "Reversible via the comment UI"); this transport keeps its own wording.
-    server.registerTool("create_comment", {
-        description: "Create a new comment on a page. The comment is ALWAYS inline and is " +
-            "anchored to (highlights) its `selection` text — there are no page-level " +
-            "comments. Content is provided as Markdown and automatically converted. " +
-            "A top-level comment REQUIRES an exact `selection`; if the selection " +
-            "cannot be found in the page the call fails (no orphan comment is left). " +
-            "Replies (parentCommentId set) inherit the parent's anchor and take no " +
-            "selection. You may also attach a `suggestedText` proposing a replacement " +
-            "for the `selection`; a human applies (or rejects) it from the UI. When " +
-            "`suggestedText` is set the `selection` MUST occur exactly once in the " +
-            "page — expand it with surrounding context if it is ambiguous.",
-        inputSchema: {
-            pageId: z.string().describe("ID of the page to comment on"),
-            content: z.string().min(1).describe("Comment content in Markdown format"),
-            selection: z
-                .string()
-                .min(1)
-                // Enforce the documented 250-char cap to match the description above.
-                .max(250)
-                .optional()
-                .describe("EXACT contiguous text from a single paragraph/block to anchor the " +
-                "comment on (<=250 chars). Required for a top-level comment; omit " +
-                "only when replying via parentCommentId."),
-            parentCommentId: z
-                .string()
-                .optional()
-                .describe("Parent comment ID to create a reply (max 2 nesting levels)"),
-            suggestedText: z
-                .string()
-                .min(1)
-                .max(2000)
-                .optional()
-                .describe("Optional proposed replacement (PLAIN TEXT) for the `selection`, " +
-                "applied by a human via the UI (never auto-applied). REQUIRES a " +
-                "`selection`; NOT allowed on a reply. When set, the `selection` must " +
-                "be UNIQUE in the page — expand it with surrounding context (still " +
-                "<=250 chars) if it occurs more than once, or the call is refused."),
-        },
-    }, async ({ pageId, content, selection, parentCommentId, suggestedText }) => {
-        if (!parentCommentId && (!selection || !selection.trim())) {
-            throw new Error("create_comment: a 'selection' (exact text to anchor on) is required for a top-level comment; omit it only when replying via parentCommentId.");
-        }
-        if (suggestedText !== undefined) {
-            if (parentCommentId) {
-                throw new Error("create_comment: 'suggestedText' cannot be attached to a reply; it applies only to a top-level inline comment.");
-            }
-            if (!selection || !selection.trim()) {
-                throw new Error("create_comment: 'suggestedText' requires a 'selection' to anchor and rewrite.");
-            }
-        }
-        const result = await docmostClient.createComment(pageId, content, "inline", selection, parentCommentId, suggestedText);
-        return jsonContent(result);
-    });
-    // Tool: update_comment
-    server.registerTool("update_comment", {
-        description: "Update an existing comment's content. Only the comment creator can " +
-            "update it. Content is provided as Markdown.",
-        inputSchema: {
-            commentId: z.string().min(1).describe("ID of the comment to update"),
-            content: z
-                .string()
-                .min(1)
-                .describe("New comment content in Markdown format"),
-        },
-    }, async ({ commentId, content }) => {
-        const result = await docmostClient.updateComment(commentId, content);
-        return jsonContent(result);
-    });
-    // Tool: delete_comment
-    server.registerTool("delete_comment", {
-        description: "Delete a comment. Only the comment creator or space admin can delete it.",
-        inputSchema: {
-            commentId: z.string().min(1).describe("ID of the comment to delete"),
-        },
-    }, async ({ commentId }) => {
-        await docmostClient.deleteComment(commentId);
-        return {
-            content: [
-                {
-                    type: "text",
-                    text: `Successfully deleted comment ${commentId}`,
-                },
-            ],
-        };
-    });
-    // Tool: resolve_comment
-    server.registerTool("resolve_comment", {
-        description: "Resolve (close) or reopen a comment thread. Only top-level comments can " +
-            "be resolved — the server rejects resolving a reply. Reversible: pass " +
-            "resolved=false to reopen. Resolving keeps the thread and its replies " +
-            "(unlike delete_comment, which permanently removes them).",
-        inputSchema: {
-            commentId: z
-                .string()
-                .min(1)
-                .describe("ID of the top-level comment thread to resolve or reopen"),
-            resolved: z
-                .boolean()
-                .optional()
-                .default(true)
-                .describe("true (default) marks the thread resolved/closed; false reopens it"),
-        },
-    }, async ({ commentId, resolved }) => {
-        const result = await docmostClient.resolveComment(commentId, resolved);
-        return jsonContent(result);
-    });
-    // Tool: check_new_comments
-    server.registerTool("check_new_comments", {
-        description: "Check for new comments across pages in a space since a given timestamp. " +
-            "Optionally scope to a page subtree (folder). Returns only comments " +
-            "created after the specified time.",
-        inputSchema: {
-            spaceId: z.string().describe("Space ID to check for new comments"),
-            since: z
-                .string()
-                .min(1)
-                .describe("ISO 8601 timestamp — only return comments created after this time (e.g. '2026-03-10T00:00:00Z')"),
-            parentPageId: z
-                .string()
-                .optional()
-                .describe("Optional root page ID to scope the check to a subtree (folder). " +
-                "Only pages under this parent will be checked."),
-        },
-    }, async ({ spaceId, since, parentPageId }) => {
-        // Reject an unparseable timestamp up front: otherwise the comparison
-        // against NaN silently treats every comment as "not new" and the tool
-        // returns zero results without signalling the bad input.
-        if (Number.isNaN(Date.parse(since))) {
-            throw new Error(`Invalid 'since' timestamp: ${JSON.stringify(since)} — expected an ISO 8601 date (e.g. '2026-03-10T00:00:00Z')`);
-        }
-        const result = await docmostClient.checkNewComments(spaceId, since, parentPageId);
-        return jsonContent(result);
-    });
-    // Tool: search
-    // INTENTIONAL per-transport divergence (not shared): the in-app `searchPages`
-    // runs a semantic + keyword hybrid (RRF) with in-process access control and a
-    // different schema (limit 1-20); this transport is a plain REST full-text search
-    // (limit up to 100). Different behaviour AND schema, so kept per-layer.
-    server.registerTool("search", {
-        description: "Full-text search for pages and content across the whole workspace. " +
-            "Results are bounded by `limit` (1-100; when omitted the server applies " +
-            "its own default).",
-        inputSchema: {
-            query: z.string().min(1).describe("Search query"),
-            limit: z
-                .number()
-                .int()
-                .min(1)
-                .max(100)
-                .optional()
-                .describe("Max results to return (max 100)"),
-        },
-    }, async ({ query, limit }) => {
-        // The tool exposes no spaceId filter, so pass undefined for the client's
-        // optional spaceId parameter and forward limit into its correct slot.
-        const result = await docmostClient.search(query, undefined, limit);
-        return jsonContent(result);
-    });
-    // Tool: docmost_transform
-    // INTENTIONAL per-transport divergence (not shared): the in-app `transformPage`
-    // deliberately omits the `deleteComments` schema field (comment-deletion
-    // guardrail) and carries a much shorter description; this transport exposes the
-    // full helper catalogue. Different schema, so kept per-layer.
-    server.registerTool("docmost_transform", {
-        description: "Edit a page by running an arbitrary JS transform `(doc, ctx) => doc` " +
-            "against its LIVE ProseMirror document, with a diff preview and page " +
-            "history as the safety net. By default dryRun=true: returns a diff " +
-            "preview WITHOUT writing. Set dryRun=false to apply (atomic, won't " +
-            "clobber concurrent edits). `doc` is the lossless ProseMirror document " +
-            "({type:'doc',content:[...]}); return a new doc of the same shape. " +
-            "`ctx` gives you: comments (the page's comments, each {id, content " +
-            "(markdown), selection, type}); log (array; console.log pushes to it); " +
-            "consume(id) (mark a comment id as consumed — those are deleted when " +
-            "deleteComments=true after a successful apply); and helpers: " +
-            "blockText(node) (plain text), walk(node, fn) (depth-first over all " +
-            "nodes incl. callouts/tables/lists), getList(doc, predicate) (find a " +
-            "node even without attrs.id), insertMarkerAfter(doc, anchor, marker, " +
-            "{beforeBlock}) (insert a plain unmarked text run after anchor, " +
-            "mark-safe), setCalloutRange(doc, n) (sync a [1]…[K] callout range to " +
-            "[1]…[n]), noteItem(inlineNodes) (wrap inline nodes in a listItem with a " +
-            "fresh id), mdToInlineNodes(markdown) (comment markdown -> inline nodes), " +
-            "commentsToFootnotes(doc, comments, {notesHeading}) (turn inline " +
-            "comments into numbered footnotes), canonicalizeFootnotes(doc) (derive " +
-            "footnote numbering + the single bottom list from reference order, drop " +
-            "orphans/duplicates — runs AUTOMATICALLY on the transform RESULT, so the " +
-            "applied (and dryRun-previewed) doc is always footnote-canonical; a dryRun " +
-            "diff may therefore show footnote tidy-ups your script did not make, and " +
-            "it is idempotent after the first run), and " +
-            "insertInlineFootnote(doc, {anchorText, text}) (author-inline footnote: " +
-            "marker + dedup'd definition, list derived). Footnote convention: markers are " +
-            "plain '[N]' text in the body; the notes are an orderedList under a " +
-            "heading whose text is 'Примечания переводчика' (that is only the DEFAULT " +
-            "notesHeading — pass the notesHeading option to the helpers to use a " +
-            "heading matching the page's language). The transform runs " +
-            "sandboxed (no require/process/fs/network, 5s timeout) and must return a " +
-            "{type:'doc'} node.",
-        inputSchema: {
-            pageId: z.string().min(1),
-            transformJs: z
-                .string()
-                .min(1)
-                .describe("A JS function `(doc, ctx) => doc` (expression-arrow or " +
-                "parenthesized function). It receives a clone of the live doc and " +
-                "ctx (comments, log, consume(id), helpers: blockText/walk/getList/" +
-                "insertMarkerAfter/setCalloutRange/noteItem/mdToInlineNodes/" +
-                "commentsToFootnotes/canonicalizeFootnotes/insertInlineFootnote) " +
-                "and must return a {type:'doc'} node."),
-            dryRun: z
-                .boolean()
-                .optional()
-                .default(true)
-                .describe("Preview only (no write) when true (default)."),
-            deleteComments: z
-                .boolean()
-                .optional()
-                .default(false)
-                .describe("After a successful apply, delete every comment id passed to " +
-                "ctx.consume(id)."),
-        },
-    }, async ({ pageId, transformJs, dryRun, deleteComments }) => {
-        const result = await docmostClient.transformPage(pageId, transformJs, {
-            dryRun,
-            deleteComments,
-        });
-        return jsonContent(result);
-    });
-    // Tool: insert_footnote
-    server.registerTool("insert_footnote", {
-        description: "Insert an AUTHOR-INLINE footnote: you specify only WHERE (anchorText) " +
-            "and WHAT (text). The footnote marker is placed right after anchorText in " +
-            "the body, and the bottom footnotes list + the numbering are derived " +
-            "deterministically server-side. You do NOT assign a number, and you " +
-            "never see or edit the footnotes list — so footnotes cannot end up out " +
-            "of order, orphaned, or as a raw '[^id]' block. If a footnote with the " +
-            "SAME text already exists, its number is REUSED (one definition, several " +
-            "references). The write is atomic and won't clobber concurrent edits; if " +
-            "anchorText is not found, nothing is written and an error is returned.",
-        inputSchema: {
-            pageId: z.string().min(1),
-            anchorText: z
-                .string()
-                .min(1)
-                .describe("A snippet of existing body text; the footnote marker is inserted " +
-                "immediately after its first occurrence (mark-safe)."),
-            text: z
-                .string()
-                .min(1)
-                .describe("The footnote content as markdown (becomes the definition)."),
-        },
-    }, async ({ pageId, anchorText, text }) => {
-        const result = await docmostClient.insertFootnote(pageId, anchorText, text);
-        return jsonContent(result);
-    });
-    // Tool: diff_page_versions
-    registerShared(SHARED_TOOL_SPECS.diffPageVersions, async ({ pageId, from, to }) => {
-        const result = await docmostClient.diffPageVersions(pageId, from, to);
-        return jsonContent(result);
-    });
-    // Tool: list_page_history
-    registerShared(SHARED_TOOL_SPECS.listPageHistory, async ({ pageId, cursor }) => {
-        const result = await docmostClient.listPageHistory(pageId, cursor);
-        return jsonContent(result);
-    });
-    // Tool: restore_page_version
-    registerShared(SHARED_TOOL_SPECS.restorePageVersion, async ({ historyId }) => {
-        const result = await docmostClient.restorePageVersion(historyId);
-        return jsonContent(result);
-    });
-    return server;
-}
diff --git a/packages/mcp/build/lib/auth-utils.js b/packages/mcp/build/lib/auth-utils.js
deleted file mode 100644
index 39b91d9d..00000000
--- a/packages/mcp/build/lib/auth-utils.js
+++ /dev/null
@@ -1,92 +0,0 @@
-import axios from "axios";
-export async function getCollabToken(baseUrl, apiToken) {
-    try {
-        const response = await axios.post(`${baseUrl}/auth/collab-token`, {}, {
-            headers: {
-                Authorization: `Bearer ${apiToken}`,
-                "Content-Type": "application/json",
-            },
-        });
-        // console.error('Collab Token Response:', response.data);
-        // Response is wrapped in { data: { token: ... } }
-        return response.data.data?.token || response.data.token;
-    }
-    catch (error) {
-        if (axios.isAxiosError(error)) {
-            // Attach the HTTP status to the plain Error so callers (e.g.
-            // getCollabTokenWithReauth) can still detect a 401/403 after the
-            // original AxiosError has been wrapped away.
-            // Avoid leaking the full server response body by default; include only
-            // status + statusText. Append the body only when DEBUG is set.
-            let message = `Failed to get collab token: ${error.response?.status} ${error.response?.statusText}`;
-            if (process.env.DEBUG) {
-                message += ` - ${JSON.stringify(error.response?.data)}`;
-            }
-            const err = new Error(message);
-            err.status = error.response?.status;
-            throw err;
-        }
-        throw error;
-    }
-}
-/**
- * Pure cookie-parsing helper extracted from `performLogin` so the parsing logic
- * can be unit-tested without performing the login network request. Given the
- * raw `Set-Cookie` header array from the login response, return the `authToken`
- * cookie's value.
- *
- * Behavior (kept identical to the original inline logic):
- *  - throws if there is no Set-Cookie header at all;
- *  - matches the cookie NAME exactly (`authToken`), so a future
- *    `authTokenRefresh=...` cookie is NOT picked up (a `startsWith` would be);
- *  - returns everything after the FIRST `=` up to the first `;`, so a base64
- *    value containing `=` padding is preserved (a naive `split("=")` would
- *    truncate it);
- *  - cookie attributes after the first `;` (Path, HttpOnly, Expires, …) are
- *    ignored;
- *  - throws if no `authToken` cookie is present.
- */
-export function extractAuthTokenFromSetCookie(cookies) {
-    if (!cookies) {
-        throw new Error("No Set-Cookie header found in login response");
-    }
-    // Match the cookie name exactly to avoid matching a future
-    // authTokenRefresh cookie (startsWith would catch it).
-    const authCookie = cookies.find((c) => {
-        const kv = c.split(";")[0];
-        return kv.slice(0, kv.indexOf("=")) === "authToken";
-    });
-    if (!authCookie) {
-        throw new Error("No authToken cookie found in login response");
-    }
-    // Take everything after the FIRST "=" up to the first ";".
-    // Splitting on "=" would truncate base64 values containing "=" padding.
-    const kv = authCookie.split(";")[0];
-    return kv.slice(kv.indexOf("=") + 1);
-}
-export async function performLogin(baseUrl, email, password) {
-    try {
-        const response = await axios.post(`${baseUrl}/auth/login`, {
-            email,
-            password,
-        });
-        // Extract token from Set-Cookie header
-        return extractAuthTokenFromSetCookie(response.headers["set-cookie"]);
-    }
-    catch (error) {
-        // Avoid leaking the full server response body by default; log only the
-        // HTTP status. Log the verbose body only when DEBUG is set.
-        if (axios.isAxiosError(error)) {
-            if (process.env.DEBUG) {
-                console.error("Login failed:", error.response?.data);
-            }
-            else {
-                console.error("Login failed:", error.response?.status);
-            }
-        }
-        else {
-            console.error("Login failed:", error.message);
-        }
-        throw error;
-    }
-}
diff --git a/packages/mcp/build/lib/collaboration.js b/packages/mcp/build/lib/collaboration.js
deleted file mode 100644
index 4504b8d0..00000000
--- a/packages/mcp/build/lib/collaboration.js
+++ /dev/null
@@ -1,743 +0,0 @@
-import { HocuspocusProvider } from "@hocuspocus/provider";
-import { TiptapTransformer } from "@hocuspocus/transformer";
-import * as Y from "yjs";
-import WebSocket from "ws";
-import { marked } from "marked";
-import { generateJSON } from "@tiptap/html";
-import { Node as PMNode } from "@tiptap/pm/model";
-import { updateYFragment } from "y-prosemirror";
-import { JSDOM } from "jsdom";
-import { docmostExtensions, docmostSchema } from "./docmost-schema.js";
-import { withPageLock } from "./page-lock.js";
-import { sanitizeForYjs, findUnstorableAttr } from "./node-ops.js";
-import { lexFootnoteLines } from "./footnote-lex.js";
-import { canonicalizeFootnotes } from "./footnote-canonicalize.js";
-import { summarizeChange } from "./diff.js";
-/**
- * Build the descriptive error for an opaque Yjs encode failure ("Unexpected
- * content type"), shared by both encode paths (`buildYDoc` -> `toYdoc` and
- * `applyDocToFragment` -> `updateYFragment`) so the message wording stays in one
- * place. `label` names the stage that failed (diagnostic). `sanitizeForYjs`
- * already stripped `undefined` attrs, so a remaining failure is pinpointed via
- * `findUnstorableAttr`.
- */
-function unstorableYjsError(safe, label, e) {
-    const bad = findUnstorableAttr(safe);
-    return new Error(`Failed to encode document to Yjs (${label}): ${e instanceof Error ? e.message : String(e)}.${bad ? ` Offending attribute: ${bad}.` : " A node/mark attribute likely holds a value Yjs cannot store (e.g. undefined)."}`);
-}
-// Setup DOM environment for Tiptap HTML parsing in Node.js
-const dom = new JSDOM("<!DOCTYPE html><html><body></body></html>");
-global.window = dom.window;
-global.document = dom.window.document;
-// @ts-ignore
-global.Element = dom.window.Element;
-// @ts-ignore
-global.WebSocket = WebSocket;
-// Navigator is read-only in newer Node versions and already exists
-// global.navigator = dom.window.navigator;
-/**
- * Hard ceiling above which we skip callout preprocessing entirely. The linear
- * scanner below has no quadratic blow-up, but we still cap input defensively so
- * a pathological multi-megabyte payload cannot tie up the event loop; in that
- * case the markdown is passed through verbatim (callouts are simply not
- * detected) rather than risking a slow scan.
- */
-const MAX_CALLOUT_PREPROCESS_BYTES = 4 * 1024 * 1024; // 4 MB
-/** Matches an opening callout fence: `:::type` (type captured, lower-cased). */
-const CALLOUT_OPEN_RE = /^:::\s*(\w+)\s*$/;
-/** Matches a bare closing callout fence: `:::`. */
-const CALLOUT_CLOSE_RE = /^:::\s*$/;
-/** Matches the start/end of a code fence (``` or ~~~), capturing the marker. */
-const CODE_FENCE_RE = /^(\s*)(`{3,}|~{3,})/;
-/**
- * Pre-process Docmost-flavoured markdown: convert `:::type ... :::`
- * callout blocks (the syntax our markdown export produces) into HTML
- * divs that the callout extension parses. The inner content is rendered
- * through marked as regular markdown.
- *
- * Implemented as a single linear pass over the lines (no quadratic regex
- * rescan). It:
- *   - tracks fenced code regions (```...``` and ~~~...~~~) and never treats a
- *     `:::` line that lives inside a code fence as a callout delimiter, so a
- *     callout body that itself contains a fenced code block with a `:::` line is
- *     no longer corrupted;
- *   - matches an opening `:::type` line with the next CLOSING `:::` at the SAME
- *     nesting level, supporting NESTED callouts via a depth counter (an inner
- *     `:::type` opens a deeper level and consumes a matching `:::`);
- *   - emits the same `<div data-type="callout" data-callout-type="TYPE">` output
- *     (inner rendered through marked) as the previous regex implementation.
- */
-async function preprocessCallouts(markdown) {
-    // Defensive cap: skip preprocessing for pathologically large inputs.
-    if (markdown.length > MAX_CALLOUT_PREPROCESS_BYTES) {
-        return markdown;
-    }
-    // Recursively transform a slice of lines, converting top-level callouts in
-    // that slice into <div> blocks and rendering their inner content (which may
-    // itself contain nested callouts) through this same function.
-    const transform = async (lines) => {
-        const out = [];
-        let inCodeFence = false;
-        let codeFenceMarker = ""; // the exact run of backticks/tildes that opened it
-        let i = 0;
-        while (i < lines.length) {
-            const line = lines[i];
-            // Inside a code fence, only its matching closing fence is significant;
-            // everything else (including `:::` lines) is copied through verbatim.
-            if (inCodeFence) {
-                out.push(line);
-                const fence = line.match(CODE_FENCE_RE);
-                if (fence && fence[2].startsWith(codeFenceMarker[0]) &&
-                    fence[2].length >= codeFenceMarker.length) {
-                    inCodeFence = false;
-                    codeFenceMarker = "";
-                }
-                i++;
-                continue;
-            }
-            // A code fence opening outside any callout body: enter code-fence mode.
-            const fenceOpen = line.match(CODE_FENCE_RE);
-            if (fenceOpen) {
-                inCodeFence = true;
-                codeFenceMarker = fenceOpen[2];
-                out.push(line);
-                i++;
-                continue;
-            }
-            // An opening callout fence: scan forward (with code-fence and nested
-            // callout awareness) for its matching closing `:::` at the same level.
-            const open = line.match(CALLOUT_OPEN_RE);
-            if (open) {
-                const type = open[1].toLowerCase();
-                const bodyLines = [];
-                let depth = 1;
-                let innerInCodeFence = false;
-                let innerCodeFenceMarker = "";
-                let j = i + 1;
-                for (; j < lines.length; j++) {
-                    const bl = lines[j];
-                    if (innerInCodeFence) {
-                        const f = bl.match(CODE_FENCE_RE);
-                        if (f && f[2].startsWith(innerCodeFenceMarker[0]) &&
-                            f[2].length >= innerCodeFenceMarker.length) {
-                            innerInCodeFence = false;
-                            innerCodeFenceMarker = "";
-                        }
-                        bodyLines.push(bl);
-                        continue;
-                    }
-                    const innerFence = bl.match(CODE_FENCE_RE);
-                    if (innerFence) {
-                        innerInCodeFence = true;
-                        innerCodeFenceMarker = innerFence[2];
-                        bodyLines.push(bl);
-                        continue;
-                    }
-                    if (CALLOUT_OPEN_RE.test(bl)) {
-                        depth++;
-                        bodyLines.push(bl);
-                        continue;
-                    }
-                    if (CALLOUT_CLOSE_RE.test(bl)) {
-                        depth--;
-                        if (depth === 0)
-                            break; // matching close for THIS callout
-                        bodyLines.push(bl);
-                        continue;
-                    }
-                    bodyLines.push(bl);
-                }
-                if (j < lines.length) {
-                    // Found the matching closing fence: render the body (recursively, so
-                    // nested callouts are handled) and emit the callout div.
-                    const inner = await transform(bodyLines);
-                    const renderedInner = await marked.parse(inner);
-                    out.push(`\n<div data-type="callout" data-callout-type="${type}">${renderedInner}</div>\n`);
-                    i = j + 1; // skip past the closing `:::`
-                    continue;
-                }
-                // No matching close (unterminated callout): treat the opener as a
-                // literal line and continue, preserving the original text.
-                out.push(line);
-                i++;
-                continue;
-            }
-            out.push(line);
-            i++;
-        }
-        return out.join("\n");
-    };
-    return transform(markdown.split("\n"));
-}
-/**
- * Bridge marked's checkbox lists to TipTap task lists.
- *
- * marked renders GitHub task list items (`- [x] done`) as a plain
- * `<ul><li><p><input type="checkbox" checked> text</p></li></ul>` WITHOUT the
- * markup TipTap's TaskList/TaskItem extensions parse. This rewrites such lists
- * into the shape those extensions expect:
- *   TaskList parseHTML matches `ul[data-type="taskList"]`,
- *   TaskItem matches `li[data-type="taskItem"]`,
- *   the checked state is read from `data-checked === "true"`.
- *
- * A list is only converted when it has at least one `<li>` and EVERY direct
- * `<li>` contains a checkbox input. Both `<ul>` and `<ol>` are considered: a
- * numbered checklist (`1. [x] a`, which marked renders as an `<ol>` of checkbox
- * `<li>`s) would otherwise lose its task state. TipTap task lists are unordered,
- * so a matching `<ol>` is emitted as `data-type="taskList"` exactly like a
- * `<ul>`. Mixed or ordinary lists (including ordinary `<ol>` lists) are left
- * untouched so they keep rendering as bullet/numbered lists. The marked `<p>`
- * wrapper is kept inside the `<li>` because TaskItem content allows paragraphs.
- */
-function bridgeTaskLists(html) {
-    // Cheap early-out: if the markup contains no checkbox input at all there is
-    // nothing to bridge, so skip the expensive JSDOM parse entirely. This is the
-    // common case (most pages have no task lists).
-    if (!/type=["']?checkbox/i.test(html)) {
-        return html;
-    }
-    // Defensive cap (consistent with preprocessCallouts): skip the bridge for
-    // pathologically large inputs rather than running a second expensive JSDOM
-    // parse on a multi-megabyte payload. The markup is passed through verbatim.
-    if (html.length > MAX_CALLOUT_PREPROCESS_BYTES) {
-        return html;
-    }
-    const dom = new JSDOM(html);
-    const document = dom.window.document;
-    // Collect the checkbox(es) that belong to THIS <li> directly: either direct
-    // child <input type="checkbox"> elements or ones inside the <li>'s direct <p>
-    // child (the shape marked emits: `<li><p><input type="checkbox"> text</p></li>`).
-    // Checkboxes nested deeper (e.g. inside a child <ul>/<ol>) are excluded so a
-    // bullet <li> that merely contains a nested task sublist is not misdetected.
-    // Raw inline HTML can put more than one checkbox in a single <li>; we gather
-    // ALL of them so none survive into the converted item.
-    const directCheckboxes = (li) => {
-        const found = [];
-        for (const child of Array.from(li.children)) {
-            if (child.tagName === "INPUT" &&
-                child.getAttribute("type") === "checkbox") {
-                found.push(child);
-                continue;
-            }
-            if (child.tagName === "P") {
-                for (const inp of Array.from(child.querySelectorAll(":scope > input[type='checkbox']"))) {
-                    found.push(inp);
-                }
-            }
-        }
-        return found;
-    };
-    // Both <ul> and <ol> are candidates: an <ol> whose every direct <li> carries
-    // its own checkbox is a numbered checklist that must also become a taskList.
-    const lists = Array.from(document.querySelectorAll("ul, ol"));
-    for (const list of lists) {
-        // Only consider DIRECT child <li> elements; nested lists are handled by
-        // their own iteration of the outer loop.
-        const items = Array.from(list.children).filter((child) => child.tagName === "LI");
-        if (items.length === 0)
-            continue;
-        const itemCheckboxes = items.map((li) => directCheckboxes(li));
-        // Convert only when every direct <li> carries at least one OWN checkbox.
-        if (!itemCheckboxes.every((boxes) => boxes.length > 0))
-            continue;
-        // A numbered checklist arrives as an <ol>. We must NOT leave the tag as
-        // <ol> while tagging it data-type="taskList": generateJSON would then match
-        // BOTH the orderedList rule (tag ol) and the taskList rule (data-type),
-        // emitting a phantom empty orderedList beside the real taskList. So rename a
-        // qualifying <ol> to a <ul> — move its <li> children over and replace it —
-        // leaving only the taskList rule to match. Already-<ul> lists are unchanged.
-        let target = list;
-        if (list.tagName === "OL") {
-            const ul = document.createElement("ul");
-            // Carry over existing attributes (e.g. class) so nothing is silently lost.
-            for (const attr of Array.from(list.attributes)) {
-                ul.setAttribute(attr.name, attr.value);
-            }
-            // Move every child node (including the <li>s we collected) into the <ul>.
-            while (list.firstChild) {
-                ul.appendChild(list.firstChild);
-            }
-            list.replaceWith(ul);
-            target = ul;
-        }
-        target.setAttribute("data-type", "taskList");
-        items.forEach((li, index) => {
-            const boxes = itemCheckboxes[index];
-            // The first checkbox determines the checked state (matches the previous
-            // single-checkbox behaviour); any extras only need removing.
-            const input = boxes[0] ?? null;
-            li.setAttribute("data-type", "taskItem");
-            const checked = input != null &&
-                (input.hasAttribute("checked") || input.checked);
-            li.setAttribute("data-checked", checked ? "true" : "false");
-            // Remove ALL direct checkbox inputs so none survive into the content
-            // (a raw-inline-HTML <li> may carry more than one).
-            for (const box of boxes) {
-                box.remove();
-            }
-        });
-    }
-    return document.body.innerHTML;
-}
-// Mirror of packages/editor-ext footnote markdown handling. A `[^id]` inline
-// marker becomes <sup data-footnote-ref data-id="id">, and `[^id]: text`
-// definition lines are collected into a single <section data-footnotes>.
-// Definition detection + fence handling are shared with analyzeFootnotes via
-// lexFootnoteLines (footnote-lex.js). FOOTNOTE_REF_RE is the inline tokenizer's.
-const FOOTNOTE_REF_RE = /\[\^([^\]\s]+)\]/;
-function escapeFootnoteAttr(value) {
-    return String(value).replace(/&/g, "&amp;").replace(/"/g, "&quot;");
-}
-const footnoteRefMarkedExtension = {
-    name: "footnoteRef",
-    level: "inline",
-    start(src) {
-        return src.match(/\[\^/)?.index ?? -1;
-    },
-    tokenizer(src) {
-        const match = FOOTNOTE_REF_RE.exec(src);
-        if (match && match.index === 0) {
-            return { type: "footnoteRef", raw: match[0], id: match[1] };
-        }
-        return undefined;
-    },
-    renderer(token) {
-        return `<sup data-footnote-ref data-id="${escapeFootnoteAttr(token.id)}"></sup>`;
-    },
-};
-marked.use({ extensions: [footnoteRefMarkedExtension] });
-/**
- * Pull `[^id]: text` definition lines out of the body and render a single
- * <section data-footnotes> for them (or "" when there are none).
- */
-function extractFootnotes(markdown) {
-    const bodyLines = [];
-    const defs = [];
-    // Shared lexer (footnote-lex): a `[^id]: ...` line inside a ``` / ~~~ code
-    // block is inert and stays in the body verbatim; only real definition lines
-    // are pulled out. analyzeFootnotes() consumes the SAME lexer so its diagnostics
-    // match exactly what import keeps/strips (#166).
-    for (const tok of lexFootnoteLines(markdown)) {
-        if (!tok.inFence && tok.definition)
-            defs.push(tok.definition);
-        else
-            bodyLines.push(tok.line);
-    }
-    if (defs.length === 0)
-        return { body: markdown, section: "" };
-    // Duplicate definition ids: FIRST WINS, the rest are DROPPED (mirror of
-    // editor-ext extractFootnoteDefinitions). Reference markers are left untouched
-    // so repeated `[^a]` references reuse the single footnote (Pandoc semantics,
-    // #166). The dropped duplicate is surfaced to the caller via analyzeFootnotes
-    // (`duplicateDefinitions`), not silently lost. MUST stay in sync with the
-    // editor-ext mirror.
-    const firstById = new Map(); // id -> first definition text
-    for (const def of defs) {
-        if (!firstById.has(def.id))
-            firstById.set(def.id, def.text);
-    }
-    const inner = [...firstById.entries()]
-        .map(([id, text]) => `<div data-footnote-def data-id="${escapeFootnoteAttr(id)}"><p>${marked.parseInline(text || "")}</p></div>`)
-        .join("");
-    return {
-        body: bodyLines.join("\n"),
-        section: `<section data-footnotes>${inner}</section>`,
-    };
-}
-/**
- * Convert markdown to a ProseMirror doc using the full Docmost schema.
- *
- * This conversion does NOT canonicalize footnotes — it is the shared, content-
- * preserving primitive used by BOTH page write paths and COMMENT bodies
- * (createComment / updateComment). Canonicalization MUST NOT run on a comment
- * body: a comment may legitimately contain a footnote-definition line
- * (`[^1]: text`) with no matching reference, and the canonicalizer drops a
- * reference-less footnotesList — which would silently delete the comment's text.
- *
- * Page write paths that DO need the canonical footnote topology call
- * `markdownToProseMirrorCanonical` instead (markdown import, update_page markdown
- * path). Keep this function reference-loss-free.
- */
-export async function markdownToProseMirror(markdownContent) {
-    const withCallouts = await preprocessCallouts(markdownContent);
-    const { body, section } = extractFootnotes(withCallouts);
-    const html = (await marked.parse(body)) + section;
-    const bridged = bridgeTaskLists(html);
-    return generateJSON(bridged, docmostExtensions);
-}
-/**
- * Page-write variant of `markdownToProseMirror`: converts markdown then enforces
- * the canonical footnote topology. The footnote `section` markdown is emitted in
- * DEFINITION order, but numbering derives from REFERENCE order, so without this
- * the bottom list renders out of order (`1, 4, 2, 3, …`); orphan definitions and
- * duplicate lists are also normalized. Idempotent — a no-op once canonical, and a
- * no-op for footnote-free content.
- *
- * Use this ONLY for full-document PAGE writes (never for comment bodies, where it
- * would drop a reference-less footnote definition — see `markdownToProseMirror`).
- */
-export async function markdownToProseMirrorCanonical(markdownContent) {
-    return canonicalizeFootnotes(await markdownToProseMirror(markdownContent));
-}
-/**
- * Build the collaboration WebSocket URL from an API base URL:
- * switch http(s)->ws(s), strip a trailing /api, mount on /collab.
- * Shared by the live read and the mutate path so both target the same socket.
- */
-export function buildCollabWsUrl(baseUrl) {
-    let wsUrl = baseUrl.replace(/^http/, "ws");
-    try {
-        const urlObj = new URL(wsUrl);
-        if (urlObj.pathname.endsWith("/api") || urlObj.pathname.endsWith("/api/")) {
-            urlObj.pathname = urlObj.pathname.replace(/\/api\/?$/, "");
-        }
-        urlObj.pathname = urlObj.pathname.replace(/\/$/, "") + "/collab";
-        // Drop any query/hash from the base URL so it is not carried into the
-        // collaboration ws URL.
-        urlObj.search = "";
-        urlObj.hash = "";
-        wsUrl = urlObj.toString();
-    }
-    catch (e) {
-        // Fallback if URL parsing fails
-        if (!wsUrl.endsWith("/collab")) {
-            wsUrl = wsUrl.replace(/\/$/, "") + "/collab";
-        }
-    }
-    return wsUrl;
-}
-/**
- * Encode a ProseMirror doc to a Yjs document, sanitizing it first and turning
- * the opaque yjs "Unexpected content type" failure into a descriptive error.
- *
- * `sanitizeForYjs` strips `undefined` node/mark attributes (the common cause of
- * the failure); if `toYdoc` still throws, `findUnstorableAttr` is used to point
- * at the offending attribute path.
- */
-export function buildYDoc(doc) {
-    const safe = sanitizeForYjs(doc);
-    try {
-        return TiptapTransformer.toYdoc(safe, "default", docmostExtensions);
-    }
-    catch (e) {
-        throw unstorableYjsError(safe, "toYdoc", e);
-    }
-}
-/**
- * Write a new ProseMirror doc into the live Yjs fragment by STRUCTURAL DIFF,
- * preserving the Yjs identity of unchanged nodes (issue #152).
- *
- * The previous approach deleted the whole fragment and re-applied a fresh Y.Doc,
- * which discarded every Yjs node id. y-prosemirror anchors the editor selection
- * to those ids, so an open editor's cursor lost its anchor and snapped to the
- * end of the document on every agent write (most visibly on comment anchoring,
- * which changes no text at all). `updateYFragment` is exactly the routine the
- * editor itself uses to sync ProseMirror edits into Yjs: it diffs the new node
- * against the current fragment and touches only the changed children, so
- * unchanged nodes keep their ids and the live cursor stays put.
- *
- * Must run inside a single `transact` so the diff applies atomically (no remote
- * update interleaves). Keeps `buildYDoc`'s `findUnstorableAttr` diagnostic for
- * the opaque "Unexpected content type" encode failure.
- */
-export function applyDocToFragment(ydoc, newDoc) {
-    const safe = sanitizeForYjs(newDoc);
-    const fragment = ydoc.getXmlFragment("default");
-    // Hydrate the ProseMirror node in its OWN try so a failure here (e.g. an
-    // unknown node type) is labelled "fromJSON" — the stage that actually threw —
-    // instead of being misattributed to the Yjs write stage (#154 review).
-    let pmNode;
-    try {
-        pmNode = PMNode.fromJSON(docmostSchema, safe);
-    }
-    catch (e) {
-        throw unstorableYjsError(safe, "fromJSON", e);
-    }
-    try {
-        ydoc.transact(() => {
-            updateYFragment(ydoc, fragment, pmNode, {
-                mapping: new Map(),
-                isOMark: new Map(),
-            });
-        });
-    }
-    catch (e) {
-        throw unstorableYjsError(safe, "updateYFragment", e);
-    }
-}
-/**
- * Run an independent Yjs-encodability check (the same `sanitizeForYjs` + schema
- * the apply path uses) and throw the same descriptive error when the doc cannot
- * be stored. Used by the dry-run preview.
- *
- * Note: it does NOT run `updateYFragment` against the live fragment, so it is an
- * encodability GATE, not a byte-for-byte rehearsal of apply — `buildYDoc`
- * (`toYdoc`) and `applyDocToFragment` (`updateYFragment`) are two different
- * encoders that nonetheless reject the same unstorable attributes. To narrow the
- * preview/apply gap it ALSO rehearses the apply path's `PMNode.fromJSON`
- * hydration, so a doc that would only fail there (e.g. an unknown node type) is
- * rejected at preview time too (#154 review). Still cheap: no live fragment, no
- * `updateYFragment`.
- */
-export function assertYjsEncodable(doc) {
-    buildYDoc(doc);
-    const safe = sanitizeForYjs(doc);
-    try {
-        PMNode.fromJSON(docmostSchema, safe);
-    }
-    catch (e) {
-        throw unstorableYjsError(safe, "fromJSON", e);
-    }
-}
-/** Time we wait for the initial handshake/sync before giving up. */
-const CONNECT_TIMEOUT_MS = 25000;
-/** Time we wait for the server to acknowledge our write before giving up. */
-const PERSIST_TIMEOUT_MS = 20000;
-/**
- * Safely mutate the live content of a page over the collaboration websocket.
- *
- * This is the single safe write path for every MCP content mutation. It:
- *   1. serializes per-page writes through withPageLock (no two MCP writes on
- *      the same page overlap);
- *   2. connects to Hocuspocus and waits for the initial sync so the local ydoc
- *      mirrors the authoritative server doc — INCLUDING edits/comments/images
- *      that are not yet in the debounced REST snapshot;
- *   3. inside onSynced, SYNCHRONOUSLY reads the live doc, runs `transform`, and
- *      writes the result back — with no `await` between read and write so no
- *      remote update can interleave and clobber concurrent human edits;
- *   4. waits for the server to acknowledge the write (unsyncedChanges -> 0)
- *      before resolving, so the next operation observes our change.
- *
- * `transform` receives the live ProseMirror doc and returns the NEW full
- * ProseMirror doc to write, or `null` to abort with no write (a no-op). If
- * `transform` throws, the error is propagated to the caller (not swallowed).
- *
- * Resolves a `MutationResult { doc, verify }`: `doc` is the doc that was
- * written (or the live doc when the transform aborted), and `verify` is a
- * verifiable change report (text/block/mark deltas) of what actually changed.
- * The report is computed AFTER the atomic read->write, so it never widens the
- * read->write window, and it never throws (it can NEVER break a write).
- */
-export async function mutatePageContent(pageId, collabToken, baseUrl, transform) {
-    return withPageLock(pageId, () => {
-        if (process.env.DEBUG) {
-            console.error(`Starting realtime content mutate for page ${pageId}`);
-            // Token prefix is sensitive; only log it under DEBUG.
-            console.error(`Token prefix: ${collabToken ? collabToken.substring(0, 5) : "NONE"}...`);
-        }
-        const ydoc = new Y.Doc();
-        const wsUrl = buildCollabWsUrl(baseUrl);
-        if (process.env.DEBUG)
-            console.error(`Connecting to WebSocket: ${wsUrl}`);
-        return new Promise((resolve, reject) => {
-            let provider;
-            let applied = false; // onSynced may fire again on reconnect — apply once.
-            let settled = false;
-            // Set true on disconnect/close so a reconnect-driven unsyncedChanges->0
-            // cannot be mistaken for a successful persist of our write.
-            let connectionLost = false;
-            let connectTimer;
-            let persistTimer;
-            let unsyncedHandler;
-            const cleanup = () => {
-                if (connectTimer)
-                    clearTimeout(connectTimer);
-                if (persistTimer)
-                    clearTimeout(persistTimer);
-                if (provider) {
-                    if (unsyncedHandler) {
-                        try {
-                            provider.off("unsyncedChanges", unsyncedHandler);
-                        }
-                        catch (err) { }
-                    }
-                    try {
-                        provider.destroy();
-                    }
-                    catch (err) { }
-                }
-            };
-            const finish = (err, value) => {
-                if (settled)
-                    return;
-                settled = true;
-                cleanup();
-                if (err)
-                    reject(err);
-                else
-                    resolve(value);
-            };
-            connectTimer = setTimeout(() => {
-                finish(new Error("Connection timeout to collaboration server"));
-            }, CONNECT_TIMEOUT_MS);
-            // Resolve once the server has acknowledged our update. The provider
-            // increments unsyncedChanges when our local update is sent and
-            // decrements it when the server replies with a SyncStatus(applied=true);
-            // reaching 0 means the authoritative in-memory ydoc on the server now
-            // contains our write.
-            const waitForPersistence = () => {
-                if (settled)
-                    return;
-                // A missing provider is a failure, not a success: without it the write
-                // can never have been acknowledged. Only an actual unsyncedChanges===0
-                // on a live provider counts as persisted.
-                if (!provider) {
-                    finish(new Error("collab provider gone before persistence"));
-                    return;
-                }
-                if (provider.unsyncedChanges === 0) {
-                    finish(null, mutationResult);
-                    return;
-                }
-                persistTimer = setTimeout(() => {
-                    finish(new Error("Timeout waiting for collaboration server to persist the update"));
-                }, PERSIST_TIMEOUT_MS);
-                unsyncedHandler = (data) => {
-                    // Only treat unsyncedChanges->0 as success when the connection is
-                    // still up. A transient disconnect + reconnect handshake can drive
-                    // the counter back to 0 without our write being re-transmitted; in
-                    // that case let the disconnect/close error win instead.
-                    if (data.number === 0 && !connectionLost) {
-                        finish(null, mutationResult);
-                    }
-                };
-                provider.on("unsyncedChanges", unsyncedHandler);
-            };
-            // The verifiable result resolved on every success/abort path. Set on
-            // abort (no-op report) and after a real write (computed change report).
-            let mutationResult;
-            provider = new HocuspocusProvider({
-                url: wsUrl,
-                name: `page.${pageId}`,
-                document: ydoc,
-                token: collabToken,
-                // @ts-ignore - Required for Node.js environment
-                WebSocketPolyfill: WebSocket,
-                onConnect: () => {
-                    if (process.env.DEBUG)
-                        console.error("WS Connect");
-                },
-                // An unexpected disconnect/close while we are still waiting (during the
-                // connect-wait before onSynced, or during the persistence wait after the
-                // write) means the update will never be acknowledged — surface it now
-                // instead of hanging until the connect/persist timeout fires. `finish`
-                // is idempotent via the `settled` flag, so the onClose that our own
-                // cleanup()->provider.destroy() triggers (after settled=true is set) is
-                // a harmless no-op and cannot cause a double-resolve.
-                onDisconnect: () => {
-                    if (process.env.DEBUG)
-                        console.error("WS Disconnect");
-                    // Mark BEFORE finish so the unsyncedChanges handler (if it races)
-                    // sees the connection as lost and won't report a false success.
-                    connectionLost = true;
-                    finish(new Error("Collaboration connection closed before the update was persisted/synced"));
-                },
-                onClose: () => {
-                    if (process.env.DEBUG)
-                        console.error("WS Close");
-                    // Mark BEFORE finish so the unsyncedChanges handler (if it races)
-                    // sees the connection as lost and won't report a false success.
-                    connectionLost = true;
-                    finish(new Error("Collaboration connection closed before the update was persisted/synced"));
-                },
-                onSynced: () => {
-                    if (applied || settled)
-                        return;
-                    applied = true;
-                    if (process.env.DEBUG)
-                        console.error("Connected and synced!");
-                    // CRITICAL: everything between reading the live doc and writing it
-                    // back must stay synchronous (no await). While the JS event loop is
-                    // not yielded, no incoming remote update can interleave, so any
-                    // already-synced concurrent edits are preserved in liveDoc.
-                    let newDoc;
-                    let beforeDoc;
-                    try {
-                        let liveDoc = TiptapTransformer.fromYdoc(ydoc, "default");
-                        if (!liveDoc ||
-                            typeof liveDoc !== "object" ||
-                            !Array.isArray(liveDoc.content)) {
-                            liveDoc = { type: "doc", content: [] };
-                        }
-                        // Snapshot the before-doc for the change report. Docs are
-                        // JSON-serializable, so this is a safe deep clone.
-                        beforeDoc = JSON.parse(JSON.stringify(liveDoc));
-                        newDoc = transform(liveDoc);
-                        if (newDoc == null) {
-                            // Transform aborted — write nothing, return the live doc with a
-                            // no-op change report.
-                            mutationResult = {
-                                doc: liveDoc,
-                                verify: {
-                                    changed: false,
-                                    textInserted: 0,
-                                    textDeleted: 0,
-                                    blocksChanged: 0,
-                                    marks: {},
-                                    summary: "no changes (transform aborted)",
-                                },
-                            };
-                            finish(null, mutationResult);
-                            return;
-                        }
-                        // Structural diff into the live fragment (issue #152): preserves
-                        // the Yjs ids of unchanged nodes, so an open editor's cursor is not
-                        // yanked to the end of the document on every agent write.
-                        applyDocToFragment(ydoc, newDoc);
-                    }
-                    catch (e) {
-                        // Includes errors thrown by transform (e.g. "afterText not found",
-                        // "text not found"): propagate them verbatim to the caller.
-                        finish(e instanceof Error ? e : new Error(String(e)));
-                        return;
-                    }
-                    // Compute the verifiable change report AFTER the transact write: it
-                    // only needs the JSON before/after, so it cannot affect the atomic
-                    // read->write window, and summarizeChange never throws.
-                    mutationResult = {
-                        doc: newDoc,
-                        verify: summarizeChange(beforeDoc, newDoc),
-                    };
-                    if (process.env.DEBUG)
-                        console.error("Content written, waiting for server to persist...");
-                    waitForPersistence();
-                },
-                onAuthenticationFailed: () => {
-                    finish(new Error("Authentication failed for collaboration connection"));
-                },
-            });
-        });
-    });
-}
-/**
- * Replace the live content of a page over the collaboration websocket.
- * Accepts a ready ProseMirror JSON document; the caller controls whether
- * it was produced from markdown (ids regenerate) or edited in place
- * (existing block ids preserved).
- *
- * This is an intentional full replace (used by update_page / update_page_json),
- * but now runs under the per-page lock and waits for server persistence via
- * mutatePageContent.
- */
-export async function replacePageContent(pageId, prosemirrorDoc, collabToken, baseUrl) {
-    // Fail fast on a bad document instead of deferring the failure into the
-    // collaboration write (where TiptapTransformer.toYdoc(undefined) used to
-    // throw). The transform must return a valid ProseMirror doc.
-    if (prosemirrorDoc == null ||
-        typeof prosemirrorDoc !== "object" ||
-        prosemirrorDoc.type !== "doc") {
-        throw new Error("replacePageContent: invalid ProseMirror document");
-    }
-    return await mutatePageContent(pageId, collabToken, baseUrl, () => prosemirrorDoc);
-}
-/**
- * Markdown update path (kept for backwards compatibility).
- * NOTE: this re-imports the whole document — block ids are regenerated.
- * Tables and :::callout::: blocks survive thanks to the full schema.
- */
-export async function updatePageContentRealtime(pageId, markdownContent, collabToken, baseUrl) {
-    // PAGE write: canonicalize footnotes (markdown import builds the bottom list in
-    // definition order; numbering is reference-ordered).
-    const tiptapJson = await markdownToProseMirrorCanonical(markdownContent);
-    return await mutatePageContent(pageId, collabToken, baseUrl, () => tiptapJson);
-}
diff --git a/packages/mcp/build/lib/comment-anchor.js b/packages/mcp/build/lib/comment-anchor.js
deleted file mode 100644
index b5c26dc4..00000000
--- a/packages/mcp/build/lib/comment-anchor.js
+++ /dev/null
@@ -1,371 +0,0 @@
-/**
- * Inline-comment anchoring against a ProseMirror document.
- *
- * Docmost stores an inline comment's highlight as a `comment` MARK on the
- * document text (`{ type: "comment", attrs: { commentId, resolved } }`); the
- * `/comments/create` API only records the comment row + its `selection` text and
- * does NOT insert that mark, so the anchor has to be written into the page
- * content separately. This module finds where a selection lives in the document
- * and splices the comment mark across the matched range.
- *
- * Matching has to be robust because the agent supplies the selection as plain
- * text while the document stores rich inline content: a selection can span
- * several adjacent text nodes (inline code / bold / links each become their own
- * text node), and the document may use smart/typographic quotes, dash variants,
- * non-breaking spaces, or collapsed runs of whitespace that the agent typed as
- * ASCII quotes/hyphens/single spaces. We therefore normalize both sides before
- * comparing and match across maximal runs of consecutive text nodes within a
- * single block, while mapping every normalized character back to its raw index
- * so the mark lands on the exact original characters.
- */
-/** Typographic double-quote variants mapped to ASCII `"`. */
-const DOUBLE_QUOTES = "«»„“”‟〝〞＂";
-/** Typographic single-quote/apostrophe variants mapped to ASCII `'`. */
-const SINGLE_QUOTES = "‘’‚‛";
-/** Dash variants mapped to ASCII `-`. */
-const DASHES = "–—―−‐‑‒";
-/** Guard against pathological/cyclic documents in the depth-first walk. */
-const MAX_DEPTH = 200;
-/** The comment mark Docmost stores on anchored text. */
-function makeCommentMark(commentId) {
-    // The comment mark schema declares both commentId and resolved; include
-    // resolved:false for completeness so the stored mark matches the editor's.
-    return { type: "comment", attrs: { commentId, resolved: false } };
-}
-/** True for any character we collapse/replace with a single normal space. */
-function isWhitespaceChar(ch) {
-    // Regular ASCII whitespace plus the special spaces called out in the spec:
-    // nbsp, narrow nbsp, en/em/thin/hair/figure spaces, etc. \s covers tab and
-    // newline; the explicit code points cover the non-breaking variants \s misses
-    // in some engines, so list them for determinism.
-    return (/\s/.test(ch) ||
-        ch === " " || // no-break space
-        ch === " " || // figure space
-        ch === " " || // narrow no-break space
-        ch === " " || // thin space
-        ch === " " || // hair space
-        ch === " " || // en space
-        ch === " " // em space
-    );
-}
-/**
- * Normalize a string for matching and return both the normalized text and a
- * `map` where `map[i]` is the index into the ORIGINAL `s` of the i-th
- * normalized character.
- *
- * Rules: map smart quotes / dashes / special spaces to their ASCII forms,
- * collapse any run of whitespace to a SINGLE space (whose map entry points at
- * the FIRST raw whitespace char of the run), and DO NOT lowercase (anchoring is
- * case-sensitive to match the exact document text).
- */
-export function normalizeForMatch(s) {
-    let norm = "";
-    const map = [];
-    let i = 0;
-    while (i < s.length) {
-        const ch = s[i];
-        if (isWhitespaceChar(ch)) {
-            // Collapse the whole whitespace run to one space mapped to the run start.
-            const runStart = i;
-            while (i < s.length && isWhitespaceChar(s[i]))
-                i++;
-            norm += " ";
-            map.push(runStart);
-            continue;
-        }
-        let mapped = ch;
-        if (DOUBLE_QUOTES.indexOf(ch) !== -1)
-            mapped = '"';
-        else if (SINGLE_QUOTES.indexOf(ch) !== -1)
-            mapped = "'";
-        else if (DASHES.indexOf(ch) !== -1)
-            mapped = "-";
-        norm += mapped;
-        map.push(i);
-        i++;
-    }
-    return { norm, map };
-}
-/**
- * Find a selection inside a SINGLE block's direct `content` array.
- *
- * Builds maximal runs of consecutive `text` nodes (any non-text inline node,
- * e.g. a mention, breaks the run), normalizes each run and the selection the
- * same way, then searches each run for the normalized selection. Returns the
- * child/offset range of the FIRST matching run, or `null` if none match.
- */
-export function findAnchorInBlock(blockContent, selection) {
-    if (!Array.isArray(blockContent))
-        return null;
-    const normSelObj = normalizeForMatch(selection);
-    // Trim leading/trailing spaces on the NORMALIZED selection only.
-    const normSel = normSelObj.norm.trim();
-    if (normSel.length === 0)
-        return null;
-    let i = 0;
-    while (i < blockContent.length) {
-        const node = blockContent[i];
-        if (!node || typeof node !== "object" || node.type !== "text") {
-            i++;
-            continue;
-        }
-        // Accumulate a maximal run of consecutive text nodes.
-        let rawRun = "";
-        const rawToChild = [];
-        let j = i;
-        while (j < blockContent.length) {
-            const n = blockContent[j];
-            if (!n || typeof n !== "object" || n.type !== "text")
-                break;
-            const text = typeof n.text === "string" ? n.text : "";
-            for (let k = 0; k < text.length; k++) {
-                rawToChild.push({ childIdx: j, offset: k });
-            }
-            rawRun += text;
-            j++;
-        }
-        // Try to match within this run.
-        const { norm, map } = normalizeForMatch(rawRun);
-        const idx = norm.indexOf(normSel);
-        if (idx !== -1) {
-            const rawStart = map[idx];
-            const rawEndExclusive = idx + normSel.length < map.length
-                ? map[idx + normSel.length]
-                : rawRun.length;
-            const startLoc = rawToChild[rawStart];
-            // rawEndExclusive points at the raw char AFTER the match; the last matched
-            // raw char is at rawEndExclusive-1, so endOffset is its offset + 1.
-            const lastLoc = rawToChild[rawEndExclusive - 1];
-            return {
-                startChild: startLoc.childIdx,
-                startOffset: startLoc.offset,
-                endChild: lastLoc.childIdx,
-                endOffset: lastLoc.offset + 1,
-            };
-        }
-        // No match in this run: continue scanning AFTER it.
-        i = j > i ? j : i + 1;
-    }
-    return null;
-}
-/**
- * Reconstruct the RAW text spanned by an AnchorMatch inside one block's
- * `content` array. `startChild..endChild` are all text nodes (guaranteed by
- * findAnchorInBlock, which only builds runs of `text` nodes), so concatenate
- * each node's text slice: from `startOffset` on the first node, up to
- * `endOffset` on the last, and the whole `.text` for any node fully inside the
- * range. Mirrors spliceCommentMark's per-node slicing so the string returned
- * here is EXACTLY the characters the comment mark will cover.
- */
-function reconstructRawText(blockContent, match) {
-    const { startChild, startOffset, endChild, endOffset } = match;
-    let out = "";
-    for (let k = startChild; k <= endChild; k++) {
-        const n = blockContent[k];
-        const text = typeof n.text === "string" ? n.text : "";
-        const sliceStart = k === startChild ? startOffset : 0;
-        const sliceEnd = k === endChild ? endOffset : text.length;
-        out += text.slice(sliceStart, sliceEnd);
-    }
-    return out;
-}
-/**
- * Return the RAW document substring that `selection` would anchor to — the exact
- * characters the comment mark will cover — or `null` when the selection cannot
- * be anchored anywhere in `doc`.
- *
- * This mirrors canAnchorInDoc / applyAnchorInDoc EXACTLY (same depth-first,
- * document-order traversal and the same findAnchorInBlock match on the FIRST
- * matching block), but instead of a boolean / an in-place mutation it
- * reconstructs the raw text spanned by the matched range. Because
- * findAnchorInBlock maps the normalized selection back to raw text-node
- * positions, the returned string is the document's ORIGINAL characters (smart
- * quotes, em-dashes, nbsp, collapsed whitespace) — NOT the normalized ASCII
- * agent input.
- *
- * Callers store THIS as the comment's `selection` so the stored value equals the
- * text actually under the mark, which is what the apply-suggestion equality
- * check (replaceYjsMarkedText's `joinedText !== expectedText`) compares against.
- * Without it a suggestion whose anchor only matched via normalization would be
- * un-appliable (spurious 409).
- */
-export function getAnchoredText(doc, selection) {
-    const visit = (node, depth) => {
-        if (depth > MAX_DEPTH || !node || typeof node !== "object")
-            return null;
-        if (!Array.isArray(node.content))
-            return null;
-        const match = findAnchorInBlock(node.content, selection);
-        if (match)
-            return reconstructRawText(node.content, match);
-        for (const child of node.content) {
-            if (child && typeof child === "object" && Array.isArray(child.content)) {
-                const found = visit(child, depth + 1);
-                if (found !== null)
-                    return found;
-            }
-        }
-        return null;
-    };
-    return visit(doc, 0);
-}
-/**
- * Depth-first, document-order check for whether `selection` can be anchored
- * anywhere in `doc`. At each node with an array `content`, first try to match
- * within that node's own content, then recurse into children that themselves
- * have a `content` array.
- */
-export function canAnchorInDoc(doc, selection) {
-    const visit = (node, depth) => {
-        if (depth > MAX_DEPTH || !node || typeof node !== "object")
-            return false;
-        if (!Array.isArray(node.content))
-            return false;
-        if (findAnchorInBlock(node.content, selection))
-            return true;
-        for (const child of node.content) {
-            if (child && typeof child === "object" && Array.isArray(child.content)) {
-                if (visit(child, depth + 1))
-                    return true;
-            }
-        }
-        return false;
-    };
-    return visit(doc, 0);
-}
-/**
- * Split the matched text nodes and splice the comment mark across the range.
- * `blockContent` is mutated IN PLACE. `match.startChild..endChild` are all text
- * nodes (guaranteed by findAnchorInBlock building runs of text nodes).
- */
-function spliceCommentMark(blockContent, match, commentId) {
-    const { startChild, startOffset, endChild, endOffset } = match;
-    const commentMark = makeCommentMark(commentId);
-    const fragments = [];
-    for (let k = startChild; k <= endChild; k++) {
-        const n = blockContent[k];
-        const text = typeof n.text === "string" ? n.text : "";
-        const sliceStart = k === startChild ? startOffset : 0;
-        const sliceEnd = k === endChild ? endOffset : text.length;
-        const before = k === startChild ? text.slice(0, startOffset) : "";
-        const marked = text.slice(sliceStart, sliceEnd);
-        const after = k === endChild ? text.slice(endOffset) : "";
-        // Process per-node so each node's OWN marks/attrs are preserved.
-        const ownMarks = Array.isArray(n.marks) ? n.marks : [];
-        // Drop any pre-existing comment mark from the marked fragment so it ends up
-        // with exactly one comment mark (the new one) rather than two.
-        const markedBaseMarks = ownMarks.filter((m) => !(m && m.type === "comment"));
-        if (before.length > 0) {
-            fragments.push({ ...n, text: before, marks: [...ownMarks] });
-        }
-        if (marked.length > 0) {
-            fragments.push({
-                ...n,
-                text: marked,
-                marks: [...markedBaseMarks, commentMark],
-            });
-        }
-        if (after.length > 0) {
-            fragments.push({ ...n, text: after, marks: [...ownMarks] });
-        }
-    }
-    blockContent.splice(startChild, endChild - startChild + 1, ...fragments);
-}
-/**
- * Count how many times `selection` occurs across the whole document, using the
- * same normalization and run-matching as findAnchorInBlock but WITHOUT stopping
- * at the first hit: every non-overlapping occurrence within each block's text
- * runs is counted and summed across all blocks (depth-first, the same traversal
- * as canAnchorInDoc).
- *
- * This is the uniqueness gate for SUGGESTIONS: because applying a suggestion
- * rewrites the exact anchored text, an ambiguous anchor (>1 occurrence) would
- * silently edit the wrong place, so a suggestion is only allowed when this
- * returns exactly 1. Ordinary comments keep first-occurrence anchoring and do
- * not use this. (Note: counts OCCURRENCES, not just matching blocks, so two
- * occurrences inside one block are correctly reported as 2.)
- */
-export function countAnchorMatches(doc, selection) {
-    const normSel = normalizeForMatch(selection).norm.trim();
-    if (normSel.length === 0)
-        return 0;
-    // Count non-overlapping occurrences of the normalized selection within a
-    // single block's direct content, matching findAnchorInBlock's run building.
-    const countInBlock = (blockContent) => {
-        if (!Array.isArray(blockContent))
-            return 0;
-        let count = 0;
-        let i = 0;
-        while (i < blockContent.length) {
-            const node = blockContent[i];
-            if (!node || typeof node !== "object" || node.type !== "text") {
-                i++;
-                continue;
-            }
-            // Accumulate a maximal run of consecutive text nodes.
-            let rawRun = "";
-            let j = i;
-            while (j < blockContent.length) {
-                const n = blockContent[j];
-                if (!n || typeof n !== "object" || n.type !== "text")
-                    break;
-                rawRun += typeof n.text === "string" ? n.text : "";
-                j++;
-            }
-            const norm = normalizeForMatch(rawRun).norm;
-            // Count every non-overlapping occurrence in this run.
-            let from = 0;
-            for (;;) {
-                const idx = norm.indexOf(normSel, from);
-                if (idx === -1)
-                    break;
-                count++;
-                from = idx + normSel.length;
-            }
-            i = j > i ? j : i + 1;
-        }
-        return count;
-    };
-    let total = 0;
-    const visit = (node, depth) => {
-        if (depth > MAX_DEPTH || !node || typeof node !== "object")
-            return;
-        if (!Array.isArray(node.content))
-            return;
-        total += countInBlock(node.content);
-        for (const child of node.content) {
-            if (child && typeof child === "object" && Array.isArray(child.content)) {
-                visit(child, depth + 1);
-            }
-        }
-    };
-    visit(doc, 0);
-    return total;
-}
-/**
- * Depth-first (same order as canAnchorInDoc) over `doc`; on the FIRST block
- * whose content matches `selection`, splice the comment mark across the matched
- * range in place and return true. Returns false (and does NOT mutate) when no
- * block matches.
- */
-export function applyAnchorInDoc(doc, selection, commentId) {
-    const visit = (node, depth) => {
-        if (depth > MAX_DEPTH || !node || typeof node !== "object")
-            return false;
-        if (!Array.isArray(node.content))
-            return false;
-        const match = findAnchorInBlock(node.content, selection);
-        if (match) {
-            spliceCommentMark(node.content, match, commentId);
-            return true;
-        }
-        for (const child of node.content) {
-            if (child && typeof child === "object" && Array.isArray(child.content)) {
-                if (visit(child, depth + 1))
-                    return true;
-            }
-        }
-        return false;
-    };
-    return visit(doc, 0);
-}
diff --git a/packages/mcp/build/lib/diff.js b/packages/mcp/build/lib/diff.js
deleted file mode 100644
index c19ff9a9..00000000
--- a/packages/mcp/build/lib/diff.js
+++ /dev/null
@@ -1,423 +0,0 @@
-/**
- * Headless, Docmost-equivalent document diff.
- *
- * Docmost's history editor computes a change set with the exact pipeline below
- * (recreateTransform -> ChangeSet.addSteps -> simplifyChanges) and renders it as
- * editor decorations. This module runs the SAME computation but serializes the
- * result to text + integrity counts instead of decorations, so a diff can be
- * previewed without a browser.
- *
- * recreateTransform here comes from @fellow/prosemirror-recreate-transform, the
- * maintained published fork of the MIT prosemirror-recreate-steps source that
- * Docmost vendors in @docmost/editor-ext; it exposes the identical
- * recreateTransform(fromDoc, toDoc, { complexSteps, wordDiffs, simplifyDiff })
- * signature.
- *
- * If recreateTransform / the changeset throws on a pathological document pair,
- * we fall back to a coarse block-level text diff so the tool never hard-fails.
- */
-import { Node } from "@tiptap/pm/model";
-import { ChangeSet, simplifyChanges } from "@tiptap/pm/changeset";
-import { recreateTransform } from "@fellow/prosemirror-recreate-transform";
-import { docmostSchema } from "./docmost-schema.js";
-/** Recursively concatenate the plain text of a JSON node. */
-function plainText(node) {
-    if (!node || typeof node !== "object")
-        return "";
-    let out = "";
-    if (typeof node.text === "string")
-        out += node.text;
-    if (Array.isArray(node.content)) {
-        for (const child of node.content)
-            out += plainText(child);
-    }
-    return out;
-}
-/** Count nodes in a JSON doc that satisfy `pred` (recursive). */
-function countNodes(doc, pred) {
-    let n = 0;
-    const visit = (node) => {
-        if (!node || typeof node !== "object")
-            return;
-        if (pred(node))
-            n++;
-        if (Array.isArray(node.content))
-            for (const c of node.content)
-                visit(c);
-    };
-    visit(doc);
-    return n;
-}
-/**
- * Count UNIQUE links in a JSON doc by their `href`. A single link can be split
- * across several adjacent text runs (e.g. a "link+bold" run followed by a "link"
- * run); counting link-bearing runs would over-count it. Walking the tree and
- * collecting hrefs into a Set keys each distinct link once. Link marks with a
- * missing/empty href are bucketed under a single "" key so a malformed link is
- * still counted as one.
- */
-function countUniqueLinks(doc) {
-    const hrefs = new Set();
-    const visit = (node) => {
-        if (!node || typeof node !== "object")
-            return;
-        if (node.type === "text" && Array.isArray(node.marks)) {
-            for (const m of node.marks) {
-                if (m && m.type === "link") {
-                    const href = m.attrs && typeof m.attrs.href === "string" ? m.attrs.href : "";
-                    hrefs.add(href);
-                }
-            }
-        }
-        if (Array.isArray(node.content))
-            for (const c of node.content)
-                visit(c);
-    };
-    visit(doc);
-    return hrefs.size;
-}
-/** Count footnoteReference nodes anywhere under a node (reading order). */
-function countFootnoteRefs(node) {
-    if (!node || typeof node !== "object")
-        return 0;
-    let n = node.type === "footnoteReference" ? 1 : 0;
-    if (Array.isArray(node.content)) {
-        for (const child of node.content)
-            n += countFootnoteRefs(child);
-    }
-    return n;
-}
-/**
- * Ordered list of footnote marker numbers found in the BODY only (every
- * top-level block before the first "Примечания..." notes heading; if no such
- * heading, the whole doc), in reading order.
- *
- * Supports BOTH representations:
- *  - real `footnoteReference` nodes (the current footnote feature) — numbered
- *    1..n by reading position, since their visible number is derived;
- *  - legacy `[N]` text markers (older translated docs) — the literal N.
- */
-function footnoteMarkers(doc, notesHeading) {
-    const top = Array.isArray(doc?.content) ? doc.content : [];
-    const notesIdx = top.findIndex((n) => n &&
-        n.type === "heading" &&
-        plainText(n).trim() === notesHeading);
-    const bodyBlocks = notesIdx >= 0 ? top.slice(0, notesIdx) : top;
-    // Real footnoteReference nodes take precedence: when present, number them by
-    // reading position (their displayed number is not stored).
-    let refCount = 0;
-    for (const block of bodyBlocks)
-        refCount += countFootnoteRefs(block);
-    if (refCount > 0) {
-        return Array.from({ length: refCount }, (_, i) => i + 1);
-    }
-    // Fallback: legacy `[N]` text markers.
-    const markers = [];
-    const re = /\[(\d+)\]/g;
-    for (const block of bodyBlocks) {
-        const text = plainText(block);
-        let m;
-        re.lastIndex = 0;
-        while ((m = re.exec(text)) !== null) {
-            markers.push(Number(m[1]));
-        }
-    }
-    return markers;
-}
-/** Compute the [old,new] integrity tuples for two JSON docs. */
-function computeIntegrity(oldDoc, newDoc, notesHeading) {
-    const images = [
-        countNodes(oldDoc, (n) => n.type === "image"),
-        countNodes(newDoc, (n) => n.type === "image"),
-    ];
-    const links = [
-        countUniqueLinks(oldDoc),
-        countUniqueLinks(newDoc),
-    ];
-    const tables = [
-        countNodes(oldDoc, (n) => n.type === "table"),
-        countNodes(newDoc, (n) => n.type === "table"),
-    ];
-    const callouts = [
-        countNodes(oldDoc, (n) => n.type === "callout"),
-        countNodes(newDoc, (n) => n.type === "callout"),
-    ];
-    const fns = [
-        footnoteMarkers(oldDoc, notesHeading),
-        footnoteMarkers(newDoc, notesHeading),
-    ];
-    return { images, links, tables, callouts, footnoteMarkers: fns };
-}
-/**
- * Resolve the lead text of the top-level block in a ProseMirror Node that
- * contains the given document position. Returns "" when out of range.
- */
-function blockContextAt(node, pos) {
-    try {
-        const clamped = Math.max(0, Math.min(pos, node.content.size));
-        const $pos = node.resolve(clamped);
-        // depth 1 is the top-level block in a doc node.
-        const block = $pos.depth >= 1 ? $pos.node(1) : $pos.node(0);
-        const text = block.textContent || "";
-        return text.length > 80 ? text.slice(0, 77) + "..." : text;
-    }
-    catch {
-        return "";
-    }
-}
-/** Truncate a string for the markdown summary. */
-function truncate(s, n = 120) {
-    return s.length > n ? s.slice(0, n - 3) + "..." : s;
-}
-/**
- * Coarse fallback: a block-by-block plain-text diff. Used only when the precise
- * changeset pipeline throws, so the tool degrades gracefully instead of failing.
- */
-function coarseDiff(oldDoc, newDoc) {
-    const oldBlocks = Array.isArray(oldDoc?.content) ? oldDoc.content : [];
-    const newBlocks = Array.isArray(newDoc?.content) ? newDoc.content : [];
-    const oldTexts = oldBlocks.map(plainText);
-    const newTexts = newBlocks.map(plainText);
-    const oldSet = new Set(oldTexts);
-    const newSet = new Set(newTexts);
-    const changes = [];
-    for (const t of oldTexts) {
-        if (!newSet.has(t) && t.trim() !== "") {
-            changes.push({ op: "delete", block: truncate(t, 80), text: t });
-        }
-    }
-    for (const t of newTexts) {
-        if (!oldSet.has(t) && t.trim() !== "") {
-            changes.push({ op: "insert", block: truncate(t, 80), text: t });
-        }
-    }
-    return changes;
-}
-/** Build the human-readable unified-ish markdown summary. */
-function renderMarkdown(result, fellBack) {
-    const lines = [];
-    const { summary, integrity, changes } = result;
-    lines.push(`# Diff: ${summary.inserted} inserted / ${summary.deleted} deleted (${summary.blocksChanged} blocks changed)`);
-    if (fellBack) {
-        lines.push("");
-        lines.push("> note: precise diff failed; coarse block-level diff shown.");
-    }
-    lines.push("");
-    lines.push("## Integrity (old -> new)");
-    lines.push(`- images: ${integrity.images[0]} -> ${integrity.images[1]}`);
-    lines.push(`- links: ${integrity.links[0]} -> ${integrity.links[1]}`);
-    lines.push(`- tables: ${integrity.tables[0]} -> ${integrity.tables[1]}`);
-    lines.push(`- callouts: ${integrity.callouts[0]} -> ${integrity.callouts[1]}`);
-    lines.push(`- footnoteMarkers: [${integrity.footnoteMarkers[0].join(", ")}] -> [${integrity.footnoteMarkers[1].join(", ")}]`);
-    lines.push("");
-    lines.push("## Changes");
-    if (changes.length === 0) {
-        lines.push("(no textual changes)");
-    }
-    else {
-        for (const c of changes) {
-            const sign = c.op === "insert" ? "+" : "-";
-            const ctx = c.block ? ` @ ${truncate(c.block, 60)}` : "";
-            lines.push(`${sign} ${truncate(c.text)}${ctx}`);
-        }
-    }
-    return lines.join("\n");
-}
-/**
- * Diff two ProseMirror JSON documents the way Docmost's history editor does and
- * serialize the result to text + integrity counts.
- *
- * @param oldDocJson the earlier document
- * @param newDocJson the later document
- * @param notesHeading heading delimiting body from notes for footnote counting
- */
-export function diffDocs(oldDocJson, newDocJson, notesHeading = "Примечания переводчика") {
-    const integrity = computeIntegrity(oldDocJson, newDocJson, notesHeading);
-    let changes = [];
-    let inserted = 0;
-    let deleted = 0;
-    let fellBack = false;
-    const changedBlocks = new Set();
-    try {
-        const oldNode = Node.fromJSON(docmostSchema, oldDocJson);
-        const newNode = Node.fromJSON(docmostSchema, newDocJson);
-        const tr = recreateTransform(oldNode, newNode, {
-            complexSteps: false,
-            wordDiffs: true,
-            simplifyDiff: true,
-        });
-        const changeSet = ChangeSet.create(oldNode).addSteps(tr.doc, tr.mapping.maps, []);
-        const simplified = simplifyChanges(changeSet.changes, newNode);
-        for (const change of simplified) {
-            // Deleted text lives in the OLD doc coordinate range [fromA, toA).
-            if (change.toA > change.fromA) {
-                const text = oldNode.textBetween(change.fromA, change.toA, "\n", " ");
-                if (text.length > 0) {
-                    deleted += text.length;
-                    const block = blockContextAt(oldNode, change.fromA);
-                    changes.push({ op: "delete", block, text });
-                    if (block)
-                        changedBlocks.add("d:" + block);
-                }
-            }
-            // Inserted text lives in the NEW doc coordinate range [fromB, toB).
-            if (change.toB > change.fromB) {
-                const text = newNode.textBetween(change.fromB, change.toB, "\n", " ");
-                if (text.length > 0) {
-                    inserted += text.length;
-                    const block = blockContextAt(newNode, change.fromB);
-                    changes.push({ op: "insert", block, text });
-                    if (block)
-                        changedBlocks.add("i:" + block);
-                }
-            }
-        }
-    }
-    catch {
-        // Pathological pair: degrade to a coarse block-level diff so we never throw.
-        fellBack = true;
-        changes = coarseDiff(oldDocJson, newDocJson);
-        for (const c of changes) {
-            if (c.op === "insert")
-                inserted += c.text.length;
-            else
-                deleted += c.text.length;
-            if (c.block)
-                changedBlocks.add(c.op[0] + ":" + c.block);
-        }
-    }
-    const partial = {
-        summary: { inserted, deleted, blocksChanged: changedBlocks.size },
-        integrity,
-        changes,
-    };
-    return { ...partial, markdown: renderMarkdown(partial, fellBack) };
-}
-/**
- * Recursively walk every `text` node and tally the count of each mark by
- * `mark.type` (e.g. `{ bold: 5, strike: 3, link: 2 }`). Pure and never throws.
- */
-function markCounts(doc) {
-    const counts = {};
-    const visit = (node) => {
-        if (!node || typeof node !== "object")
-            return;
-        if (node.type === "text" && Array.isArray(node.marks)) {
-            for (const m of node.marks) {
-                if (m && typeof m.type === "string") {
-                    counts[m.type] = (counts[m.type] || 0) + 1;
-                }
-            }
-        }
-        if (Array.isArray(node.content))
-            for (const c of node.content)
-                visit(c);
-    };
-    visit(doc);
-    return counts;
-}
-/**
- * Build a VerifyReport for a content mutation. Pure and never throws — on any
- * internal error it returns a minimal "changed (diff unavailable)" report so it
- * can NEVER break a write.
- *
- * `changed` is VALUE-based, not JSON-string-based: it is derived from the actual
- * deltas (text chars, blocks, mark counts, structural integrity counts), so two
- * value-equal docs that differ only in JSON key order report cleanly as
- * `changed:false` / "no content change" rather than a misleading +0/-0 change.
- *
- * The structural integrity delta (from diffDocs's `integrity` tuples) is what
- * makes `changed` true for an image/table/callout/link count change that diffs
- * to zero text — closing a verify blind spot for insert_image, delete_node on a
- * table, etc.
- */
-export function summarizeChange(before, after) {
-    try {
-        const diff = diffDocs(before, after);
-        // Per-mark-type delta: include a type only when its count actually changed.
-        const beforeMarks = markCounts(before);
-        const afterMarks = markCounts(after);
-        const marks = {};
-        for (const type of new Set([
-            ...Object.keys(beforeMarks),
-            ...Object.keys(afterMarks),
-        ])) {
-            const b = beforeMarks[type] || 0;
-            const a = afterMarks[type] || 0;
-            if (b !== a)
-                marks[type] = [b, a];
-        }
-        // Structural integrity delta from diffDocs: count-based [old,new] tuples for
-        // images/links/tables/callouts. Include a type only when old != new.
-        const integrity = diff.integrity;
-        const structure = {};
-        const countTypes = [
-            "images",
-            "links",
-            "tables",
-            "callouts",
-        ];
-        for (const type of countTypes) {
-            const [b, a] = integrity[type];
-            if (b !== a)
-                structure[type] = [b, a];
-        }
-        const textInserted = diff.summary.inserted;
-        const textDeleted = diff.summary.deleted;
-        const blocksChanged = diff.summary.blocksChanged;
-        const hasMarkDelta = Object.keys(marks).length > 0;
-        const hasStructureDelta = Object.keys(structure).length > 0;
-        // VALUE-based change decision: ignore JSON key-order no-ops entirely.
-        const changed = textInserted > 0 ||
-            textDeleted > 0 ||
-            blocksChanged > 0 ||
-            hasMarkDelta ||
-            hasStructureDelta;
-        if (!changed) {
-            return {
-                changed: false,
-                textInserted: 0,
-                textDeleted: 0,
-                blocksChanged: 0,
-                marks: {},
-                summary: "no content change",
-            };
-        }
-        const parts = [];
-        // Only mention text/blocks when they actually changed (avoid a misleading
-        // "+0/-0 chars, 0 block(s)" prefix on a pure mark/structure change).
-        if (textInserted > 0 || textDeleted > 0 || blocksChanged > 0) {
-            parts.push(`+${textInserted}/-${textDeleted} chars, ${blocksChanged} block(s)`);
-        }
-        const markParts = Object.entries(marks).map(([type, [b, a]]) => `${type} ${b}→${a}`);
-        if (markParts.length > 0)
-            parts.push(`marks: ${markParts.join(", ")}`);
-        const structureParts = Object.entries(structure).map(([type, [b, a]]) => `${type} ${b}→${a}`);
-        if (structureParts.length > 0)
-            parts.push(structureParts.join(", "));
-        // `changed` is true here, so at least one group is present and parts is non-empty.
-        const summary = `changed: ${parts.join("; ")}`;
-        const report = {
-            changed: true,
-            textInserted,
-            textDeleted,
-            blocksChanged,
-            marks,
-            summary,
-        };
-        if (hasStructureDelta)
-            report.structure = structure;
-        return report;
-    }
-    catch {
-        // A pathological pair must never break a write: degrade to a minimal report.
-        return {
-            changed: true,
-            textInserted: 0,
-            textDeleted: 0,
-            blocksChanged: 0,
-            marks: {},
-            summary: "changed (diff unavailable)",
-        };
-    }
-}
diff --git a/packages/mcp/build/lib/docmost-schema.js b/packages/mcp/build/lib/docmost-schema.js
deleted file mode 100644
index 2c7b576a..00000000
--- a/packages/mcp/build/lib/docmost-schema.js
+++ /dev/null
@@ -1,1172 +0,0 @@
-/**
- * Full TipTap extension set matching the real Docmost document schema.
- *
- * The default StarterKit-only schema silently destroys Docmost-specific
- * nodes (callout, table) and drops attributes it does not know about
- * (node ids, image sizing, link targets). Every code path that converts
- * to or from ProseMirror JSON must use THIS set, otherwise a round-trip
- * loses content.
- */
-import StarterKit from "@tiptap/starter-kit";
-import Image from "@tiptap/extension-image";
-import TaskList from "@tiptap/extension-task-list";
-import TaskItem from "@tiptap/extension-task-item";
-import Highlight from "@tiptap/extension-highlight";
-import Subscript from "@tiptap/extension-subscript";
-import Superscript from "@tiptap/extension-superscript";
-import { Node, Extension, Mark, getSchema } from "@tiptap/core";
-// Inlined from @tiptap/core's getStyleProperty (added after 3.20.x) so this
-// package can stay on the same @tiptap/core version as the editor and avoid a
-// duplicate-tiptap version split in the monorepo. Reads a single declaration
-// from an element's inline `style` attribute, last-wins, case-insensitive.
-function getStyleProperty(element, propertyName) {
-    const styleAttr = element.getAttribute("style");
-    if (!styleAttr) {
-        return null;
-    }
-    const decls = styleAttr.split(";").map((decl) => decl.trim()).filter(Boolean);
-    const target = propertyName.toLowerCase();
-    for (let i = decls.length - 1; i >= 0; i -= 1) {
-        const decl = decls[i];
-        const colonIndex = decl.indexOf(":");
-        if (colonIndex === -1) {
-            continue;
-        }
-        const prop = decl.slice(0, colonIndex).trim().toLowerCase();
-        if (prop === target) {
-            return decl.slice(colonIndex + 1).trim();
-        }
-    }
-    return null;
-}
-/** Allowed Docmost callout types; anything else falls back to "info". */
-const CALLOUT_TYPES = ["info", "warning", "danger", "success"];
-export const clampCalloutType = (value) => value && CALLOUT_TYPES.includes(value.toLowerCase())
-    ? value.toLowerCase()
-    : "info";
-/**
- * Allowlist guard for CSS color values imported from HTML.
- *
- * Docmost interpolates stored mark colors straight into an inline style
- * attribute (e.g. style="background-color: ${color}" / "color: ${color}").
- * An unsanitized value such as `red; --x: url(...)` or `red"><script>` would
- * let a crafted document break out of the style attribute. We therefore only
- * accept a narrow, well-formed subset of CSS <color> syntax and reject (-> null)
- * anything else.
- *
- * Accepted forms:
- *   - named colors:           letters only, e.g. "red", "rebeccapurple"
- *   - hex:                    #rgb, #rgba, #rrggbb, #rrggbbaa
- *   - functional notation:    rgb()/rgba()/hsl()/hsla() containing only
- *                             digits, %, ., commas, spaces and slashes
- */
-const SAFE_COLOR_RE = /^(?:[a-zA-Z]+|#(?:[0-9a-fA-F]{3,4}|[0-9a-fA-F]{6}|[0-9a-fA-F]{8})|(?:rgb|rgba|hsl|hsla)\([0-9.,%/\s]+\))$/;
-export const sanitizeCssColor = (value) => {
-    if (typeof value !== "string")
-        return null;
-    const color = value.trim();
-    return color && SAFE_COLOR_RE.test(color) ? color : null;
-};
-/** Docmost callout (info/warning/danger/success banner). */
-const Callout = Node.create({
-    name: "callout",
-    group: "block",
-    content: "block+",
-    defining: true,
-    addAttributes() {
-        return {
-            // Read the type from data-callout-type so generateJSON(html) preserves
-            // it; without an explicit parseHTML every imported callout became "info".
-            type: {
-                default: "info",
-                parseHTML: (el) => clampCalloutType(el.getAttribute("data-callout-type")),
-                renderHTML: (attrs) => ({
-                    "data-callout-type": clampCalloutType(attrs.type),
-                }),
-            },
-            icon: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-icon"),
-                renderHTML: (attrs) => attrs.icon ? { "data-icon": attrs.icon } : {},
-            },
-        };
-    },
-    parseHTML() {
-        return [{ tag: 'div[data-type="callout"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-type": "callout", ...HTMLAttributes }, 0];
-    },
-});
-/** Minimal table family: enough for schema round-trips and HTML parsing. */
-const Table = Node.create({
-    name: "table",
-    group: "block",
-    content: "tableRow+",
-    isolating: true,
-    parseHTML() {
-        return [{ tag: "table" }];
-    },
-    renderHTML() {
-        return ["table", ["tbody", 0]];
-    },
-});
-const TableRow = Node.create({
-    name: "tableRow",
-    content: "(tableCell | tableHeader)*",
-    parseHTML() {
-        return [{ tag: "tr" }];
-    },
-    renderHTML() {
-        return ["tr", 0];
-    },
-});
-const cellAttributes = () => ({
-    colspan: { default: 1 },
-    rowspan: { default: 1 },
-    colwidth: { default: null },
-    backgroundColor: { default: null },
-    backgroundColorName: { default: null },
-    // Column alignment so GFM aligned tables (|:--|:-:|--:|) round-trip.
-    align: {
-        default: null,
-        parseHTML: (el) => el.getAttribute("align") || el.style.textAlign || null,
-        renderHTML: (attrs) => attrs.align ? { align: attrs.align } : {},
-    },
-});
-const TableCell = Node.create({
-    name: "tableCell",
-    content: "block+",
-    isolating: true,
-    addAttributes: cellAttributes,
-    parseHTML() {
-        return [{ tag: "td" }];
-    },
-    renderHTML() {
-        return ["td", 0];
-    },
-});
-const TableHeader = Node.create({
-    name: "tableHeader",
-    content: "block+",
-    isolating: true,
-    addAttributes: cellAttributes,
-    parseHTML() {
-        return [{ tag: "th" }];
-    },
-    renderHTML() {
-        return ["th", 0];
-    },
-});
-/**
- * Attributes Docmost stores on standard nodes that the stock extensions
- * do not declare. Without these, Node.fromJSON silently drops them —
- * including the block ids that heading anchors rely on.
- */
-const DocmostAttributes = Extension.create({
-    name: "docmostAttributes",
-    addGlobalAttributes() {
-        return [
-            {
-                types: ["heading", "paragraph"],
-                attributes: {
-                    id: { default: null },
-                    indent: { default: null },
-                    textAlign: { default: null },
-                },
-            },
-            {
-                types: ["image"],
-                attributes: {
-                    align: { default: null },
-                    attachmentId: { default: null },
-                    aspectRatio: { default: null },
-                    height: { default: null },
-                    placeholder: { default: null },
-                    size: { default: null },
-                    width: { default: null },
-                },
-            },
-            {
-                types: ["orderedList"],
-                attributes: { type: { default: null } },
-            },
-            {
-                types: ["link"],
-                attributes: { internal: { default: null }, title: { default: null } },
-            },
-        ];
-    },
-});
-/**
- * Docmost inline comment mark. Anchors a comment thread to a text range via
- * `commentId`. Without it, any document containing comment highlights fails to
- * round-trip through the schema ("There is no mark type comment in this schema"),
- * which breaks update_page_json and edit_page_text on every commented page.
- * Mirrors Docmost's @docmost/editor-ext comment mark (commentId / resolved).
- */
-const Comment = Mark.create({
-    name: "comment",
-    exitable: true,
-    inclusive: false,
-    addAttributes() {
-        return {
-            commentId: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-comment-id"),
-                renderHTML: (attrs) => attrs.commentId ? { "data-comment-id": attrs.commentId } : {},
-            },
-            resolved: {
-                default: false,
-                parseHTML: (el) => el.getAttribute("data-resolved") === "true",
-                renderHTML: (attrs) => attrs.resolved ? { "data-resolved": "true" } : {},
-            },
-        };
-    },
-    parseHTML() {
-        return [{ tag: "span[data-comment-id]" }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["span", { class: "comment-mark", ...HTMLAttributes }, 0];
-    },
-});
-/**
- * Text color mark. The markdown-converter emits colored text as
- * <span style="color: ...">, but with no mark parsing it back the color was
- * silently dropped on import. This mirrors TipTap's @tiptap/extension-text-style
- * `textStyle` mark (the name Docmost expects) and carries a single `color`
- * attribute. The parsed color is passed through the allowlist guard so a crafted
- * style cannot break out of the attribute when Docmost re-renders it.
- */
-const TextStyle = Mark.create({
-    name: "textStyle",
-    addAttributes() {
-        return {
-            color: {
-                default: null,
-                parseHTML: (el) => sanitizeCssColor(el.style.color || el.getAttribute("data-color")),
-                renderHTML: (attrs) => {
-                    const color = sanitizeCssColor(attrs.color);
-                    return color ? { style: `color: ${color}` } : {};
-                },
-            },
-        };
-    },
-    parseHTML() {
-        return [
-            {
-                tag: "span",
-                // Only claim a plain colored span. Do NOT match spans that are already a
-                // comment mark (data-comment-id) or a mention node (data-type=mention),
-                // otherwise importing such HTML would silently drop the comment/mention.
-                getAttrs: (el) => el.style.color &&
-                    !el.getAttribute("data-comment-id") &&
-                    el.getAttribute("data-type") !== "mention"
-                    ? {}
-                    : false,
-            },
-        ];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["span", HTMLAttributes, 0];
-    },
-});
-/**
- * Inline spoiler mark. Mirrors the @docmost/editor-ext `spoiler` mark so a
- * document carrying a spoiler survives the MCP read -> transform -> write path
- * (and markdown export) instead of silently dropping the unrecognized mark.
- * packages/mcp does NOT depend on editor-ext, so the definition is kept local;
- * it parses span[data-spoiler] and renders the same span[data-spoiler][class]
- * the editor-ext mark emits.
- */
-const Spoiler = Mark.create({
-    name: "spoiler",
-    // Don't bleed onto text typed at the boundary (mirrors editor-ext).
-    inclusive: false,
-    parseHTML() {
-        return [{ tag: "span[data-spoiler]" }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["span", { "data-spoiler": "true", class: "spoiler", ...HTMLAttributes }, 0];
-    },
-});
-/**
- * Passthrough definitions for the remaining Docmost-specific nodes.
- *
- * TiptapTransformer.toYdoc (the write path every mutation uses) throws
- * "Unknown node type: X" for any node not registered here, so editing ANY
- * page that contains one of these nodes used to fail outright. The read path
- * (fromYdoc) accepts them, which is why they appear in real documents.
- *
- * Each node below mirrors the real @docmost/editor-ext definition's name,
- * group, content, inline/atom flags and attribute keys (with the same data-*
- * HTML mapping) so that a fromYdoc -> transform -> toYdoc round-trip both
- * validates and preserves attributes faithfully. Interactive concerns
- * (node views, commands, keyboard shortcuts, input rules, suggestion plugins)
- * are intentionally omitted: the MCP server never renders these nodes, it only
- * needs the schema to accept and carry them. The Callout node above is the
- * pattern these follow.
- */
-/** Docmost @mention (user/page reference). Inline atom. */
-const Mention = Node.create({
-    name: "mention",
-    group: "inline",
-    inline: true,
-    selectable: true,
-    atom: true,
-    draggable: true,
-    addAttributes() {
-        return {
-            id: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-id"),
-                renderHTML: (attrs) => attrs.id ? { "data-id": attrs.id } : {},
-            },
-            label: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-label"),
-                renderHTML: (attrs) => attrs.label ? { "data-label": attrs.label } : {},
-            },
-            entityType: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-entity-type"),
-                renderHTML: (attrs) => attrs.entityType ? { "data-entity-type": attrs.entityType } : {},
-            },
-            entityId: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-entity-id"),
-                renderHTML: (attrs) => attrs.entityId ? { "data-entity-id": attrs.entityId } : {},
-            },
-            slugId: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-slug-id"),
-                renderHTML: (attrs) => attrs.slugId ? { "data-slug-id": attrs.slugId } : {},
-            },
-            creatorId: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-creator-id"),
-                renderHTML: (attrs) => attrs.creatorId ? { "data-creator-id": attrs.creatorId } : {},
-            },
-            anchorId: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-anchor-id"),
-                renderHTML: (attrs) => attrs.anchorId ? { "data-anchor-id": attrs.anchorId } : {},
-            },
-        };
-    },
-    parseHTML() {
-        return [{ tag: 'span[data-type="mention"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["span", { "data-type": "mention", ...HTMLAttributes }, 0];
-    },
-});
-/**
- * Footnote feature (mirror of packages/editor-ext/src/lib/footnote). Three
- * nodes connected by `id`:
- *  - FootnoteReference: inline atom marker in the body (<sup data-footnote-ref>);
- *  - FootnotesList:     a single bottom container (<section data-footnotes>);
- *  - FootnoteDefinition: one editable note keyed by id (<div data-footnote-def>).
- * The visible number is not stored; it is derived from reference order.
- *
- * priority 101 so this node's <sup> parse rule beats the Superscript mark's
- * <sup> rule (otherwise an empty reference is parsed as an empty superscript
- * mark and dropped). Keep in sync with editor-ext.
- */
-const FootnoteReference = Node.create({
-    name: "footnoteReference",
-    priority: 101,
-    group: "inline",
-    inline: true,
-    atom: true,
-    selectable: true,
-    draggable: false,
-    addAttributes() {
-        return {
-            id: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-id"),
-                renderHTML: (attrs) => attrs.id ? { "data-id": attrs.id } : {},
-            },
-        };
-    },
-    parseHTML() {
-        return [{ tag: "sup[data-footnote-ref]", priority: 100 }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["sup", { "data-footnote-ref": "", ...HTMLAttributes }];
-    },
-});
-const FootnotesList = Node.create({
-    name: "footnotesList",
-    group: "block",
-    content: "footnoteDefinition+",
-    isolating: true,
-    selectable: false,
-    defining: true,
-    parseHTML() {
-        return [{ tag: "section[data-footnotes]" }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["section", { "data-footnotes": "", ...HTMLAttributes }, 0];
-    },
-});
-const FootnoteDefinition = Node.create({
-    name: "footnoteDefinition",
-    content: "paragraph+",
-    defining: true,
-    isolating: true,
-    selectable: false,
-    addAttributes() {
-        return {
-            id: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-id"),
-                renderHTML: (attrs) => attrs.id ? { "data-id": attrs.id } : {},
-            },
-        };
-    },
-    parseHTML() {
-        return [{ tag: "div[data-footnote-def]" }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-footnote-def": "", ...HTMLAttributes }, 0];
-    },
-});
-/** Inline KaTeX expression. Carries the LaTeX source in `text`. */
-const MathInline = Node.create({
-    name: "mathInline",
-    group: "inline",
-    inline: true,
-    atom: true,
-    addAttributes() {
-        return {
-            text: { default: "" },
-        };
-    },
-    parseHTML() {
-        return [{ tag: 'span[data-type="mathInline"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return [
-            "span",
-            { "data-type": "mathInline", "data-katex": "true" },
-            `${HTMLAttributes.text ?? ""}`,
-        ];
-    },
-});
-/** Block KaTeX expression. Carries the LaTeX source in `text`. */
-const MathBlock = Node.create({
-    name: "mathBlock",
-    group: "block",
-    atom: true,
-    isolating: true,
-    addAttributes() {
-        return {
-            text: { default: "" },
-        };
-    },
-    parseHTML() {
-        return [{ tag: 'div[data-type="mathBlock"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return [
-            "div",
-            { "data-type": "mathBlock", "data-katex": "true" },
-            `${HTMLAttributes.text ?? ""}`,
-        ];
-    },
-});
-/** Collapsible <details> wrapper: summary + content children. */
-const Details = Node.create({
-    name: "details",
-    group: "block",
-    content: "detailsSummary detailsContent",
-    defining: true,
-    isolating: true,
-    addAttributes() {
-        return {
-            open: {
-                default: false,
-                parseHTML: (el) => el.getAttribute("open"),
-                renderHTML: (attrs) => attrs.open ? { open: "" } : {},
-            },
-        };
-    },
-    parseHTML() {
-        return [{ tag: "details" }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["details", { ...HTMLAttributes }, 0];
-    },
-});
-/** Clickable summary line of a <details> block. */
-const DetailsSummary = Node.create({
-    name: "detailsSummary",
-    group: "block",
-    content: "inline*",
-    defining: true,
-    isolating: true,
-    selectable: false,
-    parseHTML() {
-        return [{ tag: "summary" }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["summary", { "data-type": "detailsSummary", ...HTMLAttributes }, 0];
-    },
-});
-/** Body of a <details> block. Permissive content so fromYdoc output validates. */
-const DetailsContent = Node.create({
-    name: "detailsContent",
-    group: "block",
-    // Docmost declares block* (an empty details body is valid); block+ would
-    // reject a collapsed/empty details on round-trip.
-    content: "block*",
-    defining: true,
-    selectable: false,
-    parseHTML() {
-        return [{ tag: 'div[data-type="detailsContent"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-type": "detailsContent", ...HTMLAttributes }, 0];
-    },
-});
-/** File attachment card (non-image upload). Block atom. */
-const Attachment = Node.create({
-    name: "attachment",
-    group: "block",
-    inline: false,
-    isolating: true,
-    atom: true,
-    defining: true,
-    draggable: true,
-    addAttributes() {
-        return {
-            url: {
-                default: "",
-                parseHTML: (el) => el.getAttribute("data-attachment-url"),
-                renderHTML: (attrs) => ({
-                    "data-attachment-url": attrs.url ?? "",
-                }),
-            },
-            name: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-attachment-name"),
-                renderHTML: (attrs) => attrs.name ? { "data-attachment-name": attrs.name } : {},
-            },
-            mime: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-attachment-mime"),
-                renderHTML: (attrs) => attrs.mime ? { "data-attachment-mime": attrs.mime } : {},
-            },
-            size: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-attachment-size"),
-                renderHTML: (attrs) => attrs.size != null ? { "data-attachment-size": attrs.size } : {},
-            },
-            attachmentId: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-attachment-id"),
-                renderHTML: (attrs) => attrs.attachmentId
-                    ? { "data-attachment-id": attrs.attachmentId }
-                    : {},
-            },
-            // Docmost declares `placeholder` (a transient upload key, not rendered
-            // to HTML). Carry it so a round-trip never hits "Unsupported attribute".
-            placeholder: { default: null },
-        };
-    },
-    parseHTML() {
-        return [{ tag: 'div[data-type="attachment"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-type": "attachment", ...HTMLAttributes }, 0];
-    },
-});
-/** Uploaded <video> player. Block atom. */
-const Video = Node.create({
-    name: "video",
-    group: "block",
-    isolating: true,
-    atom: true,
-    defining: true,
-    draggable: true,
-    addAttributes() {
-        return {
-            src: {
-                default: "",
-                parseHTML: (el) => el.getAttribute("src"),
-                renderHTML: (attrs) => ({ src: attrs.src ?? "" }),
-            },
-            alt: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("aria-label"),
-                renderHTML: (attrs) => attrs.alt ? { "aria-label": attrs.alt } : {},
-            },
-            attachmentId: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-attachment-id"),
-                renderHTML: (attrs) => attrs.attachmentId
-                    ? { "data-attachment-id": attrs.attachmentId }
-                    : {},
-            },
-            width: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("width"),
-                renderHTML: (attrs) => attrs.width != null ? { width: attrs.width } : {},
-            },
-            height: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("height"),
-                renderHTML: (attrs) => attrs.height != null ? { height: attrs.height } : {},
-            },
-            size: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-size"),
-                renderHTML: (attrs) => attrs.size != null ? { "data-size": attrs.size } : {},
-            },
-            align: {
-                default: "center",
-                parseHTML: (el) => el.getAttribute("data-align"),
-                renderHTML: (attrs) => attrs.align ? { "data-align": attrs.align } : {},
-            },
-            aspectRatio: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-aspect-ratio"),
-                renderHTML: (attrs) => attrs.aspectRatio != null
-                    ? { "data-aspect-ratio": attrs.aspectRatio }
-                    : {},
-            },
-            // Docmost declares `placeholder` (a transient upload key, not rendered
-            // to HTML). Carry it so a round-trip never hits "Unsupported attribute".
-            placeholder: { default: null },
-        };
-    },
-    parseHTML() {
-        return [{ tag: "video" }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["video", { controls: "true", ...HTMLAttributes }];
-    },
-});
-/**
- * Defensive passthrough for a `youtube` node. Docmost itself has no dedicated
- * youtube node (YouTube is handled via `embed`), but the converter read path
- * references this type, so accept it as a generic block atom that preserves
- * its src so legacy/external documents survive a round-trip.
- */
-const Youtube = Node.create({
-    name: "youtube",
-    group: "block",
-    inline: false,
-    isolating: true,
-    atom: true,
-    defining: true,
-    draggable: true,
-    addAttributes() {
-        return {
-            src: {
-                default: "",
-                parseHTML: (el) => el.getAttribute("data-src"),
-                renderHTML: (attrs) => ({
-                    "data-src": attrs.src ?? "",
-                }),
-            },
-            width: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-width"),
-                renderHTML: (attrs) => attrs.width != null ? { "data-width": attrs.width } : {},
-            },
-            height: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-height"),
-                renderHTML: (attrs) => attrs.height != null ? { "data-height": attrs.height } : {},
-            },
-            align: {
-                default: "center",
-                parseHTML: (el) => el.getAttribute("data-align"),
-                renderHTML: (attrs) => attrs.align ? { "data-align": attrs.align } : {},
-            },
-        };
-    },
-    parseHTML() {
-        return [{ tag: 'div[data-type="youtube"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-type": "youtube", ...HTMLAttributes }, 0];
-    },
-});
-/** Generic embed (provider iframe). Block atom. */
-const Embed = Node.create({
-    name: "embed",
-    group: "block",
-    inline: false,
-    isolating: true,
-    atom: true,
-    defining: true,
-    draggable: true,
-    addAttributes() {
-        return {
-            src: {
-                default: "",
-                parseHTML: (el) => el.getAttribute("data-src"),
-                renderHTML: (attrs) => ({
-                    "data-src": attrs.src ?? "",
-                }),
-            },
-            provider: {
-                default: "",
-                parseHTML: (el) => el.getAttribute("data-provider"),
-                renderHTML: (attrs) => ({
-                    "data-provider": attrs.provider ?? "",
-                }),
-            },
-            align: {
-                default: "center",
-                parseHTML: (el) => el.getAttribute("data-align"),
-                renderHTML: (attrs) => ({
-                    "data-align": attrs.align ?? "center",
-                }),
-            },
-            width: {
-                default: 800,
-                parseHTML: (el) => el.getAttribute("data-width"),
-                renderHTML: (attrs) => ({
-                    "data-width": attrs.width,
-                }),
-            },
-            height: {
-                default: 600,
-                parseHTML: (el) => el.getAttribute("data-height"),
-                renderHTML: (attrs) => ({
-                    "data-height": attrs.height,
-                }),
-            },
-        };
-    },
-    parseHTML() {
-        return [{ tag: 'div[data-type="embed"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-type": "embed", ...HTMLAttributes }, 0];
-    },
-});
-/**
- * Docmost raw HTML embed. Block atom; the client renders `source` inside a
- * sandboxed iframe. The MCP server never renders it — it only needs the
- * schema to accept and carry the node so a fromYdoc -> transform -> toYdoc
- * round-trip does not throw "Unknown node type: htmlEmbed". Mirrors the
- * @docmost/editor-ext node name, attribute keys and flags; keep in sync when
- * the editor-ext htmlEmbed schema changes.
- *
- * NOTE: unlike the canonical editor-ext node, `data-source` here is mapped as
- * plain text rather than base64-encoded. That is intentional: the MCP write
- * path carries the node through Yjs (fromYdoc -> toYdoc) on its JSON `source`
- * attribute and never invokes parseHTML/renderHTML, and htmlEmbed is not
- * produced from the markdown/HTML (generateJSON) path. If a future HTML path
- * for htmlEmbed is added here, this mapping must adopt editor-ext's base64
- * encode/decode to avoid double-encoding `source`.
- */
-const HtmlEmbed = Node.create({
-    name: "htmlEmbed",
-    group: "block",
-    inline: false,
-    isolating: true,
-    atom: true,
-    defining: true,
-    draggable: true,
-    addAttributes() {
-        return {
-            source: {
-                default: "",
-                parseHTML: (el) => el.getAttribute("data-source") ?? "",
-                renderHTML: (attrs) => ({
-                    "data-source": attrs.source ?? "",
-                }),
-            },
-            height: {
-                default: null,
-                parseHTML: (el) => {
-                    const v = el.getAttribute("data-height");
-                    if (!v)
-                        return null;
-                    const n = parseInt(v, 10);
-                    return Number.isFinite(n) ? n : null;
-                },
-                renderHTML: (attrs) => attrs.height != null ? { "data-height": String(attrs.height) } : {},
-            },
-        };
-    },
-    parseHTML() {
-        return [{ tag: 'div[data-type="htmlEmbed"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-type": "htmlEmbed", ...HTMLAttributes }, 0];
-    },
-});
-/** Shared attribute set for drawio/excalidraw diagram nodes. */
-const diagramAttributes = () => ({
-    src: {
-        default: "",
-        parseHTML: (el) => el.getAttribute("data-src"),
-        renderHTML: (attrs) => ({
-            "data-src": attrs.src ?? "",
-        }),
-    },
-    title: {
-        default: null,
-        parseHTML: (el) => el.getAttribute("data-title"),
-        renderHTML: (attrs) => attrs.title ? { "data-title": attrs.title } : {},
-    },
-    alt: {
-        default: null,
-        parseHTML: (el) => el.getAttribute("data-alt"),
-        renderHTML: (attrs) => attrs.alt ? { "data-alt": attrs.alt } : {},
-    },
-    width: {
-        default: null,
-        parseHTML: (el) => el.getAttribute("data-width"),
-        renderHTML: (attrs) => attrs.width != null ? { "data-width": attrs.width } : {},
-    },
-    height: {
-        default: null,
-        parseHTML: (el) => el.getAttribute("data-height"),
-        renderHTML: (attrs) => attrs.height != null ? { "data-height": attrs.height } : {},
-    },
-    size: {
-        default: null,
-        parseHTML: (el) => el.getAttribute("data-size"),
-        renderHTML: (attrs) => attrs.size != null ? { "data-size": attrs.size } : {},
-    },
-    aspectRatio: {
-        default: null,
-        parseHTML: (el) => el.getAttribute("data-aspect-ratio"),
-        renderHTML: (attrs) => attrs.aspectRatio != null
-            ? { "data-aspect-ratio": attrs.aspectRatio }
-            : {},
-    },
-    align: {
-        default: "center",
-        parseHTML: (el) => el.getAttribute("data-align"),
-        renderHTML: (attrs) => attrs.align ? { "data-align": attrs.align } : {},
-    },
-    attachmentId: {
-        default: null,
-        parseHTML: (el) => el.getAttribute("data-attachment-id"),
-        renderHTML: (attrs) => attrs.attachmentId ? { "data-attachment-id": attrs.attachmentId } : {},
-    },
-});
-/** draw.io diagram. Block atom (image-backed). */
-const Drawio = Node.create({
-    name: "drawio",
-    group: "block",
-    inline: false,
-    isolating: true,
-    atom: true,
-    defining: true,
-    draggable: true,
-    addAttributes: diagramAttributes,
-    parseHTML() {
-        return [{ tag: 'div[data-type="drawio"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-type": "drawio", ...HTMLAttributes }, 0];
-    },
-});
-/** Excalidraw diagram. Block atom (image-backed). */
-const Excalidraw = Node.create({
-    name: "excalidraw",
-    group: "block",
-    inline: false,
-    isolating: true,
-    atom: true,
-    defining: true,
-    draggable: true,
-    addAttributes: diagramAttributes,
-    parseHTML() {
-        return [{ tag: 'div[data-type="excalidraw"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-type": "excalidraw", ...HTMLAttributes }, 0];
-    },
-});
-/** Multi-column layout container holding one or more `column` children. */
-const Columns = Node.create({
-    name: "columns",
-    group: "block",
-    content: "column+",
-    defining: true,
-    isolating: true,
-    addAttributes() {
-        return {
-            layout: {
-                default: "two_equal",
-                parseHTML: (el) => el.getAttribute("data-layout"),
-                renderHTML: (attrs) => attrs.layout ? { "data-layout": attrs.layout } : {},
-            },
-            widthMode: {
-                default: "normal",
-                parseHTML: (el) => el.getAttribute("data-width-mode") || "normal",
-                renderHTML: (attrs) => attrs.widthMode && attrs.widthMode !== "normal"
-                    ? { "data-width-mode": attrs.widthMode }
-                    : {},
-            },
-        };
-    },
-    parseHTML() {
-        return [{ tag: 'div[data-type="columns"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-type": "columns", ...HTMLAttributes }, 0];
-    },
-});
-/** Single column within a `columns` layout. */
-const Column = Node.create({
-    name: "column",
-    group: "block",
-    content: "block+",
-    defining: true,
-    isolating: true,
-    selectable: false,
-    addAttributes() {
-        return {
-            width: {
-                default: null,
-                parseHTML: (el) => {
-                    const value = el.getAttribute("data-width");
-                    return value ? parseFloat(value) : null;
-                },
-                renderHTML: (attrs) => attrs.width ? { "data-width": attrs.width } : {},
-            },
-        };
-    },
-    parseHTML() {
-        return [{ tag: 'div[data-type="column"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-type": "column", ...HTMLAttributes }, 0];
-    },
-});
-/**
- * Subpages listing block (auto-generated index of child pages). Docmost
- * declares no attributes; the markdown-converter has a `case "subpages"`, so
- * the read path can emit it and toYdoc must accept it. Block atom.
- */
-const Subpages = Node.create({
-    name: "subpages",
-    group: "block",
-    inline: false,
-    isolating: true,
-    atom: true,
-    defining: true,
-    draggable: true,
-    parseHTML() {
-        return [{ tag: 'div[data-type="subpages"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-type": "subpages", ...HTMLAttributes }, 0];
-    },
-});
-/** Uploaded <audio> player. Block atom. Mirrors Docmost audio attrs. */
-const Audio = Node.create({
-    name: "audio",
-    group: "block",
-    inline: false,
-    isolating: true,
-    atom: true,
-    defining: true,
-    draggable: true,
-    addAttributes() {
-        return {
-            src: {
-                default: "",
-                parseHTML: (el) => el.getAttribute("src"),
-                renderHTML: (attrs) => ({ src: attrs.src ?? "" }),
-            },
-            attachmentId: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-attachment-id"),
-                renderHTML: (attrs) => attrs.attachmentId
-                    ? { "data-attachment-id": attrs.attachmentId }
-                    : {},
-            },
-            size: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-size"),
-                renderHTML: (attrs) => attrs.size != null ? { "data-size": attrs.size } : {},
-            },
-            // Transient upload key Docmost declares with rendered:false; carried so
-            // a round-trip never hits "Unsupported attribute".
-            placeholder: { default: null },
-        };
-    },
-    parseHTML() {
-        return [{ tag: "audio" }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["audio", { controls: "true", ...HTMLAttributes }];
-    },
-});
-/** Embedded PDF viewer. Block atom. Mirrors Docmost pdf attrs. */
-const Pdf = Node.create({
-    name: "pdf",
-    group: "block",
-    inline: false,
-    isolating: true,
-    atom: true,
-    defining: true,
-    draggable: true,
-    addAttributes() {
-        return {
-            src: {
-                default: "",
-                parseHTML: (el) => el.getAttribute("src"),
-                renderHTML: (attrs) => ({ src: attrs.src ?? "" }),
-            },
-            name: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-name"),
-                renderHTML: (attrs) => attrs.name ? { "data-name": attrs.name } : {},
-            },
-            attachmentId: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-attachment-id"),
-                renderHTML: (attrs) => attrs.attachmentId
-                    ? { "data-attachment-id": attrs.attachmentId }
-                    : {},
-            },
-            size: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("data-size"),
-                renderHTML: (attrs) => attrs.size != null ? { "data-size": attrs.size } : {},
-            },
-            width: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("width"),
-                renderHTML: (attrs) => attrs.width != null ? { width: attrs.width } : {},
-            },
-            height: {
-                default: null,
-                parseHTML: (el) => el.getAttribute("height"),
-                renderHTML: (attrs) => attrs.height != null ? { height: attrs.height } : {},
-            },
-            // Transient upload key Docmost declares with rendered:false; carried so
-            // a round-trip never hits "Unsupported attribute".
-            placeholder: { default: null },
-        };
-    },
-    parseHTML() {
-        return [{ tag: 'div[data-type="pdf"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-type": "pdf", ...HTMLAttributes }, 0];
-    },
-});
-/** Page break (print/export divider). Block atom; Docmost declares no attrs. */
-const PageBreak = Node.create({
-    name: "pageBreak",
-    group: "block",
-    inline: false,
-    isolating: true,
-    atom: true,
-    defining: true,
-    draggable: true,
-    parseHTML() {
-        return [{ tag: 'div[data-type="pageBreak"]' }];
-    },
-    renderHTML({ HTMLAttributes }) {
-        return ["div", { "data-type": "pageBreak", ...HTMLAttributes }];
-    },
-});
-/**
- * Full extension list. Image is block-level (matches Docmost); the
- * ProseMirror DOM parser hoists <img> found inside <p> automatically.
- * StarterKit v3 already bundles the link extension, configured here.
- */
-export const docmostExtensions = [
-    StarterKit.configure({
-        codeBlock: {},
-        heading: {},
-        link: { openOnClick: false },
-    }),
-    // Stock @tiptap/extension-image has no caption attribute, so a round-trip
-    // through this schema would drop the data-caption the client TiptapImage
-    // emits. Mirror editor-ext image.ts: add a caption attribute that parses
-    // data-caption and re-renders it only when set (caption-less images stay
-    // clean), keeping the MCP markdown round-trip lossless.
-    Image.extend({
-        addAttributes() {
-            const parent = this.parent?.() ?? {};
-            return {
-                ...parent,
-                caption: {
-                    default: undefined,
-                    parseHTML: (el) => el.getAttribute("data-caption") || undefined,
-                    renderHTML: (attrs) => attrs.caption ? { "data-caption": attrs.caption } : {},
-                },
-            };
-        },
-    }).configure({ inline: false }),
-    TaskList,
-    TaskItem.configure({ nested: true }),
-    // Highlight stores its color unescaped and Docmost interpolates it into
-    // style="background-color: ${color}". Wrap the color attribute's parseHTML
-    // with the same allowlist guard used by textStyle so a crafted import color
-    // cannot break out of the style attribute. Multicolor behavior is preserved.
-    Highlight.extend({
-        addAttributes() {
-            const parent = this.parent?.() ?? {};
-            return {
-                ...parent,
-                color: {
-                    ...parent.color,
-                    parseHTML: (el) => sanitizeCssColor(el.getAttribute("data-color") ||
-                        getStyleProperty(el, "background-color") ||
-                        el.style.backgroundColor),
-                },
-            };
-        },
-    }).configure({ multicolor: true }),
-    Subscript,
-    Superscript,
-    // StarterKit does not provide a textStyle mark, so register ours; without it
-    // generateJSON drops <span style="color: ...">, defeating the color import.
-    TextStyle,
-    Comment,
-    Spoiler,
-    Callout,
-    Table,
-    TableRow,
-    TableCell,
-    TableHeader,
-    Mention,
-    FootnoteReference,
-    FootnotesList,
-    FootnoteDefinition,
-    MathInline,
-    MathBlock,
-    Details,
-    DetailsSummary,
-    DetailsContent,
-    Attachment,
-    Video,
-    Youtube,
-    Embed,
-    HtmlEmbed,
-    Drawio,
-    Excalidraw,
-    Columns,
-    Column,
-    Subpages,
-    Audio,
-    Pdf,
-    PageBreak,
-    DocmostAttributes,
-];
-/**
- * The ProseMirror schema for the docmost editor, built ONCE from
- * `docmostExtensions`. Pure and reused by every consumer (diff, collaboration
- * write-back) so the schema can never drift between call sites — it lives next
- * to the extension list it is derived from.
- */
-export const docmostSchema = getSchema(docmostExtensions);
diff --git a/packages/mcp/build/lib/filters.js b/packages/mcp/build/lib/filters.js
deleted file mode 100644
index eb056968..00000000
--- a/packages/mcp/build/lib/filters.js
+++ /dev/null
@@ -1,92 +0,0 @@
-/**
- * Filter functions to extract only relevant information from API responses
- * for better agent consumption
- */
-export function filterWorkspace(data) {
-    return {
-        id: data.id,
-        name: data.name,
-        description: data.description,
-        defaultSpaceId: data.defaultSpaceId,
-        createdAt: data.createdAt,
-        updatedAt: data.updatedAt,
-        deletedAt: data.deletedAt,
-    };
-}
-export function filterSpace(space) {
-    return {
-        id: space.id,
-        name: space.name,
-        description: space.description,
-        slug: space.slug,
-        visibility: space.visibility,
-        createdAt: space.createdAt,
-        updatedAt: space.updatedAt,
-        deletedAt: space.deletedAt,
-    };
-}
-export function filterGroup(group) {
-    return {
-        id: group.id,
-        name: group.name,
-        description: group.description,
-        workspaceId: group.workspaceId,
-        createdAt: group.createdAt,
-        updatedAt: group.updatedAt,
-        deletedAt: group.deletedAt,
-    };
-}
-export function filterPage(page, content, subpages) {
-    return {
-        id: page.id,
-        slugId: page.slugId,
-        title: page.title,
-        parentPageId: page.parentPageId,
-        spaceId: page.spaceId,
-        isLocked: page.isLocked,
-        createdAt: page.createdAt,
-        updatedAt: page.updatedAt,
-        deletedAt: page.deletedAt,
-        // Include converted markdown content if valid string (even empty)
-        ...(typeof content === "string" && { content }),
-        // Include subpages if provided
-        ...(subpages &&
-            subpages.length > 0 && {
-            subpages: subpages.map((p) => ({ id: p.id, title: p.title })),
-        }),
-    };
-}
-export function filterComment(comment, markdownContent) {
-    return {
-        id: comment.id,
-        pageId: comment.pageId,
-        content: markdownContent ?? comment.content,
-        selection: comment.selection || null,
-        type: comment.type || "page",
-        parentCommentId: comment.parentCommentId || null,
-        creatorId: comment.creatorId,
-        creatorName: comment.creator?.name || null,
-        createdAt: comment.createdAt,
-        editedAt: comment.editedAt || null,
-        resolvedAt: comment.resolvedAt || null,
-        resolvedById: comment.resolvedById || null,
-        // Suggestion state: the proposed replacement text (if any) and, once a human
-        // applies it via the UI, when and by whom.
-        suggestedText: comment.suggestedText || null,
-        suggestionAppliedAt: comment.suggestionAppliedAt || null,
-        suggestionAppliedById: comment.suggestionAppliedById || null,
-    };
-}
-export function filterSearchResult(result) {
-    return {
-        id: result.id,
-        title: result.title,
-        parentPageId: result.parentPageId,
-        createdAt: result.createdAt,
-        updatedAt: result.updatedAt,
-        rank: result.rank,
-        highlight: result.highlight,
-        spaceId: result.space?.id,
-        spaceName: result.space?.name,
-    };
-}
diff --git a/packages/mcp/build/lib/footnote-analyze.js b/packages/mcp/build/lib/footnote-analyze.js
deleted file mode 100644
index 0bae93c7..00000000
--- a/packages/mcp/build/lib/footnote-analyze.js
+++ /dev/null
@@ -1,101 +0,0 @@
-/**
- * Footnote diagnostics for imported Markdown (issue #166).
- *
- * A PURE, fence-aware text scan (independent of the Markdown->ProseMirror
- * conversion path, so it reports the same problems for `create_page`,
- * `update_page` and `import_page_markdown`). It never changes the document — the
- * importer still creates the page; this only surfaces footnote problems to the
- * caller so an agent can fix its own markup instead of shipping broken footnotes.
- *
- * Detected problems:
- *  - danglingReferences: a `[^id]` reference with no `[^id]:` definition.
- *  - emptyDefinitions:   a `[^id]:` whose (kept) text is empty/whitespace.
- *  - duplicateDefinitions: an id defined by two or more `[^id]:` lines (only the
- *    first is kept on import — first-wins; see extractFootnotes).
- *  - referencesInTables: a `[^id]` marker found in a GFM table row (heuristic:
- *    the line, trimmed, starts with `|`) — footnotes in table cells often do not
- *    render as expected.
- */
-import { lexFootnoteLines, forEachFootnoteReference, } from "./footnote-lex.js";
-/**
- * Analyze the footnotes in a Markdown string. Pure; safe to call on any body.
- */
-export function analyzeFootnotes(markdown) {
-    // Distinct reference ids in first-appearance order, plus the set of ids seen
-    // inside a table row.
-    const refIds = [];
-    const refIdSet = new Set();
-    const referencesInTables = new Set();
-    const addRef = (id, inTable) => {
-        if (!refIdSet.has(id)) {
-            refIdSet.add(id);
-            refIds.push(id);
-        }
-        if (inTable)
-            referencesInTables.add(id);
-    };
-    // Definition texts per id, in first-appearance order of the id.
-    const defTextsById = new Map();
-    // Same lexer the importer uses, so the analysis matches exactly what import
-    // keeps/strips (#166): fenced lines are inert, definition lines are pulled.
-    for (const tok of lexFootnoteLines(markdown)) {
-        if (tok.inFence)
-            continue;
-        if (tok.definition) {
-            const { id, text } = tok.definition;
-            const arr = defTextsById.get(id);
-            if (arr)
-                arr.push(text);
-            else
-                defTextsById.set(id, [text]);
-            // A definition's TEXT can itself reference another footnote (`[^a]: see
-            // [^b]`); count those so such a `[^b]` is not falsely reported dangling.
-            forEachFootnoteReference(text, (rid) => addRef(rid, false));
-            continue;
-        }
-        const inTable = tok.line.trimStart().startsWith("|");
-        forEachFootnoteReference(tok.line, (id) => addRef(id, inTable));
-    }
-    const danglingReferences = refIds.filter((id) => !defTextsById.has(id));
-    const duplicateDefinitions = [];
-    const emptyDefinitions = [];
-    for (const [id, texts] of defTextsById) {
-        if (texts.length >= 2)
-            duplicateDefinitions.push(id);
-        // First-wins: the kept definition is the first one; flag it if it is blank.
-        if ((texts[0] ?? "").trim().length === 0)
-            emptyDefinitions.push(id);
-    }
-    const tableRefs = [...referencesInTables];
-    const warnings = [];
-    const list = (ids) => ids.map((id) => `[^${id}]`).join(", ");
-    if (danglingReferences.length > 0) {
-        warnings.push(`Footnote reference(s) with no matching definition: ${list(danglingReferences)} (each will render as an empty footnote in the editor).`);
-    }
-    if (emptyDefinitions.length > 0) {
-        warnings.push(`Footnote definition(s) with empty text: ${list(emptyDefinitions)}.`);
-    }
-    if (duplicateDefinitions.length > 0) {
-        warnings.push(`Footnote id(s) defined more than once (only the first definition was kept): ${list(duplicateDefinitions)}.`);
-    }
-    if (tableRefs.length > 0) {
-        warnings.push(`Footnote marker(s) inside a table row (footnotes in table cells may not render as expected): ${list(tableRefs)}.`);
-    }
-    return {
-        danglingReferences,
-        emptyDefinitions,
-        duplicateDefinitions,
-        referencesInTables: tableRefs,
-        warnings,
-    };
-}
-/**
- * The optional `footnoteWarnings` field for a page-write tool result: present
- * (with the warning lines) only when `markdown` has footnote problems, omitted
- * otherwise. One helper so all three call sites (create/update/import) attach the
- * field identically. Spread into the result: `{ ...result, ...footnoteWarningsField(text) }`.
- */
-export function footnoteWarningsField(markdown) {
-    const { warnings } = analyzeFootnotes(markdown);
-    return warnings.length > 0 ? { footnoteWarnings: warnings } : {};
-}
diff --git a/packages/mcp/build/lib/footnote-authoring.js b/packages/mcp/build/lib/footnote-authoring.js
deleted file mode 100644
index ab8d7eb2..00000000
--- a/packages/mcp/build/lib/footnote-authoring.js
+++ /dev/null
@@ -1,88 +0,0 @@
-/**
- * Inline-authoring helpers for footnotes (MCP).
- *
- * These build/identify footnote DEFINITION nodes for the author-inline tool
- * (`insertInlineFootnote` in transforms.ts): a content key to de-duplicate notes
- * by text, a definition-node factory, and a fresh uuidv7-style id generator.
- *
- * Split out of `footnote-canonicalize.ts` so that module stays a pure MIRROR of
- * the editor-ext canonicalizer (compositionally symmetric to the editor-ext
- * copy, which keeps its authoring helpers in `footnote-util.ts`). The pure
- * canonicalizer has no dependency on these.
- */
-const FOOTNOTE_DEFINITION_NAME = "footnoteDefinition";
-function cloneJson(v) {
-    if (typeof structuredClone === "function")
-        return structuredClone(v);
-    return JSON.parse(JSON.stringify(v));
-}
-/**
- * Normalized content key for de-duplicating footnote DEFINITIONS by their text.
- *
- * Two definitions with the same key are the SAME footnote — so the inline
- * authoring tool reuses one id (one number, one definition, several references)
- * instead of minting a second definition. Key = plaintext (whitespace-collapsed,
- * trimmed) PLUS a signature of the inline mark types in order, so two notes that
- * read the same but differ in formatting (one bold, one plain) are NOT merged.
- * Conservative: only an exact match merges.
- */
-export function footnoteContentKey(defNode) {
-    const parts = [];
-    const visit = (n) => {
-        if (!n || typeof n !== "object")
-            return;
-        if (n.type === "text" && typeof n.text === "string") {
-            const marks = Array.isArray(n.marks)
-                ? n.marks.map((m) => m?.type).filter(Boolean).sort().join(",")
-                : "";
-            parts.push(`${n.text}${marks}`);
-        }
-        if (Array.isArray(n.content))
-            for (const c of n.content)
-                visit(c);
-    };
-    visit(defNode);
-    // Collapse the assembled text's whitespace and trim, keeping the mark
-    // signature attached so formatting differences still distinguish notes.
-    return parts
-        .join("")
-        .replace(/[ \t\r\n]+/g, " ")
-        .trim();
-}
-/**
- * Build a footnoteDefinition node from inline ProseMirror nodes, keyed by id.
- */
-export function makeFootnoteDefinition(id, inlineNodes) {
-    const content = Array.isArray(inlineNodes) ? cloneJson(inlineNodes) : [];
-    return {
-        type: FOOTNOTE_DEFINITION_NAME,
-        attrs: { id },
-        content: [{ type: "paragraph", content }],
-    };
-}
-/**
- * Generate a uuidv7-style id (time-ordered), matching editor-ext's
- * `generateFootnoteId`. Used for a genuinely-new inline footnote id.
- */
-export function generateFootnoteId() {
-    const now = Date.now();
-    const timeHex = now.toString(16).padStart(12, "0");
-    const rand = (length) => {
-        let s = "";
-        for (let i = 0; i < length; i++)
-            s += Math.floor(Math.random() * 16).toString(16);
-        return s;
-    };
-    const versioned = "7" + rand(3);
-    const variantNibble = (8 + Math.floor(Math.random() * 4)).toString(16);
-    const variant = variantNibble + rand(3);
-    return (timeHex.slice(0, 8) +
-        "-" +
-        timeHex.slice(8, 12) +
-        "-" +
-        versioned +
-        "-" +
-        variant +
-        "-" +
-        rand(12));
-}
diff --git a/packages/mcp/build/lib/footnote-canonicalize.js b/packages/mcp/build/lib/footnote-canonicalize.js
deleted file mode 100644
index d2d91400..00000000
--- a/packages/mcp/build/lib/footnote-canonicalize.js
+++ /dev/null
@@ -1,215 +0,0 @@
-/**
- * Server-side footnote canonicalizer (MCP mirror — PURE).
- *
- * `canonicalizeFootnotes(doc)` is a pure ProseMirror-JSON port of the editor's
- * `footnoteSyncPlugin` end-state, identical in behaviour to
- * `@docmost/editor-ext`'s `canonicalizeFootnotes`. It is mirrored here — rather
- * than imported from editor-ext — for the SAME reason `footnote-lex.ts` and the
- * `docmost-schema.ts` nodes are mirrored: the MCP package is deliberately
- * decoupled from the browser/React-heavy editor barrel and operates on plain
- * JSON. The editor-ext copy owns the golden test against the live plugin; this
- * copy must stay behaviourally identical (a SHARED golden corpus, exercised by
- * both test suites, pins that — see `test/unit/footnote-corpus.mjs`).
- *
- * This module is the pure MIRROR only. The inline-authoring helpers
- * (`footnoteContentKey`, `makeFootnoteDefinition`, `generateFootnoteId`) used by
- * `insertInlineFootnote` live in the sibling `footnote-authoring.ts`, so this
- * file is compositionally symmetric to the editor-ext copy.
- *
- * Why it exists: every NON-editor write path (markdown import, update_page_json,
- * docmost_transform, insert_footnote) builds ProseMirror JSON directly, so the
- * editor's footnote plugins never run and the canonical topology (sequential
- * numbering by first reference, one trailing list, no orphans, no raw `[^id]`)
- * was never enforced. Running this at the end of every write path closes that
- * gap; because it is idempotent, it is a no-op when the footnotes are already
- * canonical (no spurious mutations / git-sync churn).
- *
- * ENFORCEMENT RULE (#228): any NEW FULL-document persist path MUST call
- * `canonicalizeFootnotes(doc)` before writing — the current callers are
- * `markdownToProseMirrorCanonical` (page markdown import/update; the plain
- * `markdownToProseMirror` used for COMMENT bodies must NOT, or it would drop a
- * reference-less definition), `update_page_json`, `docmost_transform`,
- * `insert_footnote`, and `copy_page_content`. Append/prepend FRAGMENT writes MUST
- * NOT canonicalize. This is deliberately per-call-site (the replace-vs-fragment
- * and comment-vs-page nuances make a single naive wrapper unsafe).
- */
-const FOOTNOTE_REFERENCE_NAME = "footnoteReference";
-const FOOTNOTES_LIST_NAME = "footnotesList";
-const FOOTNOTE_DEFINITION_NAME = "footnoteDefinition";
-function cloneJson(v) {
-    if (typeof structuredClone === "function")
-        return structuredClone(v);
-    return JSON.parse(JSON.stringify(v));
-}
-function isEmptyParagraph(node) {
-    return (!!node &&
-        node.type === "paragraph" &&
-        (!Array.isArray(node.content) || node.content.length === 0));
-}
-function collectReferenceIds(node, out, seen) {
-    if (!node || typeof node !== "object")
-        return;
-    if (node.type === FOOTNOTE_REFERENCE_NAME) {
-        const id = node?.attrs?.id;
-        if (id && !seen.has(id)) {
-            seen.add(id);
-            out.push(id);
-        }
-    }
-    if (Array.isArray(node.content)) {
-        for (const child of node.content)
-            collectReferenceIds(child, out, seen);
-    }
-}
-function collectDefinitions(node, out) {
-    if (!node || typeof node !== "object")
-        return;
-    if (node.type === FOOTNOTE_DEFINITION_NAME)
-        out.push(node);
-    if (Array.isArray(node.content)) {
-        for (const child of node.content)
-            collectDefinitions(child, out);
-    }
-}
-function emptyDefinition(id) {
-    return {
-        type: FOOTNOTE_DEFINITION_NAME,
-        attrs: { id },
-        content: [{ type: "paragraph" }],
-    };
-}
-/**
- * Deep equality over plain JSON: arrays are compared POSITIONALLY
- * (order-SENSITIVE), object keys order-insensitively. The array order-sensitivity
- * is required for correctness here — a reordered `footnotesList.content` must
- * compare UNEQUAL so the canonical rebuild fires instead of leaving it in place.
- */
-function deepEqualJson(a, b) {
-    if (a === b)
-        return true;
-    if (a == null || b == null || typeof a !== typeof b)
-        return false;
-    if (Array.isArray(a) || Array.isArray(b)) {
-        if (!Array.isArray(a) || !Array.isArray(b) || a.length !== b.length) {
-            return false;
-        }
-        for (let i = 0; i < a.length; i++) {
-            if (!deepEqualJson(a[i], b[i]))
-                return false;
-        }
-        return true;
-    }
-    if (typeof a === "object") {
-        const ka = Object.keys(a);
-        const kb = Object.keys(b);
-        if (ka.length !== kb.length)
-            return false;
-        for (const k of ka) {
-            if (!Object.prototype.hasOwnProperty.call(b, k))
-                return false;
-            if (!deepEqualJson(a[k], b[k]))
-                return false;
-        }
-        return true;
-    }
-    return false;
-}
-/**
- * Canonicalize footnotes in a ProseMirror-JSON document. See the file header and
- * the editor-ext twin for the full contract. Pure (deep-clones input,
- * deterministic, idempotent).
- */
-export function canonicalizeFootnotes(doc) {
-    if (doc == null ||
-        typeof doc !== "object" ||
-        !Array.isArray(doc.content)) {
-        return doc;
-    }
-    const out = cloneJson(doc);
-    // 1) Distinct reference ids in document order (deep — refs can live in
-    //    callouts, tables, list items, ...). The ordering/numbering truth.
-    const referenceIds = [];
-    collectReferenceIds(out, referenceIds, new Set());
-    // 2) Every definition node in document order (deep).
-    const defNodes = [];
-    collectDefinitions(out, defNodes);
-    // 3) First definition per id wins; later duplicates carry the SAME id, so they
-    //    cannot be referenced separately and would be orphans — they are dropped.
-    const defById = new Map();
-    for (const d of defNodes) {
-        const id = d?.attrs?.id;
-        if (id && !defById.has(id))
-            defById.set(id, d);
-    }
-    // 4) Build the ordered definition list: one per referenced id, in REFERENCE
-    //    order, reusing the existing node (shallow-copied, id normalized — `out` is
-    //    already deep-cloned and the old lists are cut) or synthesizing an empty
-    //    one. Definitions whose id is not referenced are orphans and never added.
-    const orderedDefs = [];
-    for (const id of referenceIds) {
-        const existing = defById.get(id);
-        if (existing) {
-            orderedDefs.push({
-                ...existing,
-                attrs: { ...(existing.attrs ?? {}), id },
-            });
-        }
-        else {
-            orderedDefs.push(emptyDefinition(id));
-        }
-    }
-    // 5) No references -> there must be NO list at all (at any depth).
-    if (referenceIds.length === 0) {
-        stripFootnotesListsDeep(out);
-        return out;
-    }
-    // 6) Placement parity with the live plugin: when the document is ALREADY in the
-    //    canonical single-list state, leave that list exactly where it sits rather
-    //    than cutting and re-inserting it at the end (the plugin never repositions a
-    //    sole correct list, so moving it would silently reorder any content that
-    //    follows the list on the first write).
-    const topLevelLists = out.content.filter((n) => n && n.type === FOOTNOTES_LIST_NAME);
-    if (topLevelLists.length === 1 &&
-        defNodes.length === orderedDefs.length &&
-        deepEqualJson(topLevelLists[0].content, orderedDefs)) {
-        return out;
-    }
-    // 7) Otherwise rebuild: strip every footnotesList AND every bare
-    //    footnoteDefinition at ANY depth (collectDefinitions gathers defs
-    //    recursively, so a list nested in a callout/blockquote — or a bare
-    //    definition outside any list — would otherwise have its defs copied into the
-    //    rebuilt list while the original survives in place → duplicates) and
-    //    re-insert exactly one list after the last meaningful (non-empty paragraph)
-    //    top-level block.
-    stripFootnotesListsDeep(out);
-    stripFootnoteDefinitionsDeep(out);
-    const top = out.content;
-    let insertAt = top.length;
-    while (insertAt > 0 && isEmptyParagraph(top[insertAt - 1]))
-        insertAt--;
-    top.splice(insertAt, 0, { type: FOOTNOTES_LIST_NAME, content: orderedDefs });
-    out.content = top;
-    return out;
-}
-/** Remove every `footnotesList` node at ANY depth (mutates the given clone). */
-function stripFootnotesListsDeep(node) {
-    if (!node || typeof node !== "object" || !Array.isArray(node.content))
-        return;
-    node.content = node.content.filter((c) => !(c && c.type === FOOTNOTES_LIST_NAME));
-    for (const child of node.content)
-        stripFootnotesListsDeep(child);
-}
-/**
- * Remove every BARE `footnoteDefinition` node at ANY depth (mutates the given
- * clone). Runs only in the rebuild path AFTER the lists are stripped, so it
- * targets definitions that were sitting outside a list (e.g. hand-authored via a
- * raw-JSON write path and nested in a callout); their content was already copied
- * into the rebuilt list, so leaving the originals would duplicate them.
- */
-function stripFootnoteDefinitionsDeep(node) {
-    if (!node || typeof node !== "object" || !Array.isArray(node.content))
-        return;
-    node.content = node.content.filter((c) => !(c && c.type === FOOTNOTE_DEFINITION_NAME));
-    for (const child of node.content)
-        stripFootnoteDefinitionsDeep(child);
-}
diff --git a/packages/mcp/build/lib/footnote-lex.js b/packages/mcp/build/lib/footnote-lex.js
deleted file mode 100644
index 3c22d149..00000000
--- a/packages/mcp/build/lib/footnote-lex.js
+++ /dev/null
@@ -1,55 +0,0 @@
-/**
- * Shared, fence-aware line lexer for footnote markdown (MCP-internal).
- *
- * Both the importer (`extractFootnotes` in collaboration.ts, which strips
- * definition lines and rebuilds a footnotes section) and the diagnostics
- * (`analyzeFootnotes` in footnote-analyze.ts) must agree EXACTLY on which lines
- * are definitions and which lines are inert (inside a code fence). Sharing one
- * lexer makes "the analyzer sees what the importer leaves" a structural property
- * instead of two hand-kept copies that can drift (#166 review).
- *
- * NOTE: this is deliberately NOT shared with editor-ext's
- * `extractFootnoteDefinitions` — that lives in a different package and the
- * decoupling between the editor and the MCP mirror is intentional.
- */
-/** A footnote DEFINITION line: `[^id]: text` (id + text captured). */
-export const FOOTNOTE_DEF_RE = /^\[\^([^\]\s]+)\]:[ \t]*(.*)$/;
-/** Every footnote REFERENCE `[^id]` in a line (global; id captured). */
-export const FOOTNOTE_REF_RE_G = /\[\^([^\]\s]+)\]/g;
-/** Opening/closing code fence marker (``` or ~~~). */
-const FENCE_RE = /^(\s*)(`{3,}|~{3,})/;
-/** Classify every line of `markdown`, tracking fenced-code state. Pure. */
-export function lexFootnoteLines(markdown) {
-    const out = [];
-    let fence = null;
-    for (const line of markdown.split("\n")) {
-        const fenceMatch = FENCE_RE.exec(line);
-        if (fenceMatch) {
-            const marker = fenceMatch[2][0];
-            if (fence === null)
-                fence = marker; // opening fence
-            else if (marker === fence)
-                fence = null; // matching closing fence
-            out.push({ line, inFence: true, definition: null });
-            continue;
-        }
-        if (fence !== null) {
-            out.push({ line, inFence: true, definition: null });
-            continue;
-        }
-        const m = FOOTNOTE_DEF_RE.exec(line);
-        out.push({
-            line,
-            inFence: false,
-            definition: m ? { id: m[1], text: m[2] } : null,
-        });
-    }
-    return out;
-}
-/** Scan a line for every `[^id]` reference, invoking `onRef(id)` for each. */
-export function forEachFootnoteReference(line, onRef) {
-    FOOTNOTE_REF_RE_G.lastIndex = 0;
-    let m;
-    while ((m = FOOTNOTE_REF_RE_G.exec(line)) !== null)
-        onRef(m[1]);
-}
diff --git a/packages/mcp/build/lib/internal-file-urls.js b/packages/mcp/build/lib/internal-file-urls.js
deleted file mode 100644
index 3fc89bbe..00000000
--- a/packages/mcp/build/lib/internal-file-urls.js
+++ /dev/null
@@ -1,110 +0,0 @@
-// Detection + collection of INTERNAL Docmost file URLs inside a ProseMirror doc.
-//
-// An internal file URL is a relative path served by Docmost's authenticated
-// attachment route (`GET /api/files/:fileId/:fileName`). It is useless to an
-// external consumer (relative + needs a Docmost session), so the stash tool
-// mirrors every such resource into the blob sandbox and rewrites its `src`.
-//
-// The criterion is "internal file URL", NOT the node TYPE: image, drawio,
-// excalidraw, video and file nodes all carry such a `src`, so a type-agnostic
-// walker covers them all. External http(s) srcs (CDNs) are left untouched.
-//
-// Mirrors editor-ext's isInternalFileUrl / normalizeFileUrl (kept as a local
-// dup so the ESM mcp package does not depend on the editor-ext build).
-function isInternalFileUrl(url) {
-    if (typeof url !== "string")
-        return false;
-    const normalized = url.trim();
-    return (normalized.startsWith("/api/files/") || normalized.startsWith("/files/"));
-}
-/** Normalize a bare `/files/...` src to the canonical `/api/files/...` form. */
-export function normalizeFileUrl(src) {
-    const trimmed = src.trim();
-    if (trimmed.startsWith("/files/"))
-        return "/api" + trimmed;
-    return trimmed;
-}
-/**
- * Resolve a page-content `src` into the safe, `/api`-relative path the stash
- * tool may fetch over the authenticated loopback client — or THROW.
- *
- * SECURITY (SSRF / path-traversal): `src` comes from page content and is fully
- * attacker-controllable. The mirroring fetch runs through the AUTHENTICATED
- * loopback axios client whose baseURL ends in `/api`, so a naive
- * `src.replace(/^\/api/, "")` lets a crafted value like
- * `/api/files/../auth/whoami` collapse (via axios/WHATWG URL `..` resolution)
- * into an ARBITRARY internal GET endpoint, whose authed response would then be
- * stored in the anonymous sandbox (SSRF + data exfiltration). A prefix-only
- * `startsWith("/api/files/")` check does NOT defend against this because the
- * `..` segments are still present in the raw string and resolved later.
- *
- * This function defeats that by resolving the canonical pathname FIRST and only
- * then asserting it still lives under `/api/files/`:
- *  - it rejects any percent-encoded dot/slash (`%2e` / `%2f`): the WHATWG URL
- *    parser collapses LITERAL `../` but does NOT decode `%2f` separators, so a
- *    content-controlled src must never be allowed to smuggle those past the
- *    canonicalization;
- *  - it resolves `new URL(trimmed, "http://internal.invalid").pathname`, which
- *    normalizes `..`/`.` segments (e.g. `/api/files/../auth/whoami` →
- *    `/api/auth/whoami`);
- *  - it then requires the canonical pathname to start with `/api/files/`, so a
- *    traversal that escaped that subtree is rejected.
- *
- * Returns the path RELATIVE to the `/api` base (e.g. `/files/<id>/<name>`),
- * ready to hand to the loopback client. The throw happens BEFORE any network
- * call, so a rejected src is counted as a failed mirror and its original src is
- * kept (the per-image try/catch in stashPage never aborts the whole document).
- */
-export function resolveInternalFilePath(src) {
-    const trimmed = src.trim();
-    // Percent-encoded dot/slash must never reach the URL canonicalizer: the
-    // WHATWG parser does NOT decode `%2f` into a path separator, so an encoded
-    // `..%2fauth` would survive canonicalization and still escape /api/files/.
-    if (/%2e|%2f/i.test(trimmed)) {
-        throw new Error(`Refusing internal file src with percent-encoded path segment: "${src}"`);
-    }
-    let pathname;
-    try {
-        // The base host is irrelevant (never contacted); it only lets the parser
-        // resolve a relative `src` and normalize `..`/`.` segments.
-        pathname = new URL(trimmed, "http://internal.invalid").pathname;
-    }
-    catch {
-        throw new Error(`Invalid internal file src: "${src}"`);
-    }
-    if (!pathname.startsWith("/api/files/")) {
-        throw new Error(`Refusing internal file src that escapes /api/files/: "${src}"`);
-    }
-    // Strip the `/api` base prefix; the loopback client's baseURL already ends
-    // in `/api`, so it expects the path relative to that (e.g. /files/<id>/<f>).
-    return pathname.replace(/^\/api/, "");
-}
-/**
- * Recursively collect every node whose `attrs.src` is an internal file URL.
- * Returns references to the live nodes (so the caller can rewrite `attrs.src`
- * in place on its clone). Descends `content` arrays, covering callouts, tables,
- * details and any other nested container.
- */
-export function collectInternalFileNodes(doc) {
-    const out = [];
-    const visit = (node) => {
-        if (!node)
-            return;
-        if (Array.isArray(node)) {
-            for (const child of node)
-                visit(child);
-            return;
-        }
-        if (typeof node !== "object")
-            return;
-        if (node.attrs && isInternalFileUrl(node.attrs.src)) {
-            out.push(node);
-        }
-        if (Array.isArray(node.content)) {
-            for (const child of node.content)
-                visit(child);
-        }
-    };
-    visit(doc);
-    return out;
-}
diff --git a/packages/mcp/build/lib/json-edit.js b/packages/mcp/build/lib/json-edit.js
deleted file mode 100644
index 4a98a4c5..00000000
--- a/packages/mcp/build/lib/json-edit.js
+++ /dev/null
@@ -1,393 +0,0 @@
-/**
- * Surgical text edits on a ProseMirror document without re-importing it.
- *
- * Each edit replaces an exact substring of a block's inline text, preserving
- * every node id, mark and attribute around it. Matching works at the
- * INLINE-CONTAINER (block) level: a block's text nodes are flattened into a
- * per-character array, so a `find` may freely cross bold/italic/link
- * boundaries (separate text nodes). The replacement inherits marks from the
- * unchanged common prefix/suffix of the match, so editing plain text next to a
- * bold word keeps the bold word bold, and editing the inside of a bold word
- * keeps the inserted text bold. This is the safe alternative to a full markdown
- * re-import for small wording fixes.
- */
-import { stripInlineMarkdown, stripBalancedWrappers } from "./text-normalize.js";
-/** Placeholder code unit standing in for one opaque (non-text) inline node. */
-const ATOM_PLACEHOLDER = "￼"; // OBJECT REPLACEMENT CHARACTER
-/**
- * Find every VALID occurrence of `needle` in a block's flattened slots.
- *
- * A candidate occurrence at slot range [start, start+needle.length) is valid
- * ONLY IF none of the slots in that range are atoms (non-text inline nodes).
- * This makes atom matching collision-safe against the U+FFFC placeholder: an
- * atom slot can never be part of a match, while a real text node containing a
- * literal U+FFFC code unit still matches normally (its slot has no `.atom`).
- *
- * Overlapping candidates that touch an atom are skipped (not counted, not
- * spliced); the scan resumes one code unit past the rejected start so a valid
- * match that begins just after an atom is not missed.
- */
-function findValidMatches(chars, plain, needle) {
-    if (!needle)
-        return [];
-    const positions = [];
-    let idx = plain.indexOf(needle);
-    while (idx !== -1) {
-        const end = idx + needle.length;
-        let hasAtom = false;
-        for (let i = idx; i < end; i++) {
-            if (chars[i] && chars[i].atom) {
-                hasAtom = true;
-                break;
-            }
-        }
-        if (!hasAtom) {
-            positions.push(idx);
-            // Non-overlapping: skip past this match.
-            idx = plain.indexOf(needle, end);
-        }
-        else {
-            // This candidate crosses an atom: reject it and resume one unit later so
-            // an overlapping valid match starting after the atom is still found.
-            idx = plain.indexOf(needle, idx + 1);
-        }
-    }
-    return positions;
-}
-/** Order-sensitive deep-equality of two marks arrays. */
-function marksEqual(a, b) {
-    if (a === b)
-        return true;
-    if (a.length !== b.length)
-        return false;
-    for (let i = 0; i < a.length; i++) {
-        if (JSON.stringify(a[i]) !== JSON.stringify(b[i]))
-            return false;
-    }
-    return true;
-}
-/** A block is any node that DIRECTLY contains at least one inline text child. */
-function isInlineBlock(node) {
-    return (Array.isArray(node?.content) &&
-        node.content.some((child) => child && child.type === "text"));
-}
-/** Flatten a block's inline content into a per-code-unit slot array. */
-function flattenBlock(node) {
-    const chars = [];
-    for (const child of node.content || []) {
-        if (child && child.type === "text" && typeof child.text === "string") {
-            const marks = child.marks || [];
-            // Iterate by UTF-16 code unit so indices align with String.indexOf.
-            for (let i = 0; i < child.text.length; i++) {
-                chars.push({ ch: child.text[i], marks });
-            }
-        }
-        else {
-            // Any non-text inline node becomes one opaque slot.
-            chars.push({
-                ch: ATOM_PLACEHOLDER,
-                marks: (child && child.marks) || [],
-                atom: child,
-            });
-        }
-    }
-    return chars;
-}
-/** Re-tokenize a slot array back into ProseMirror inline nodes. */
-function tokenizeChars(chars) {
-    const out = [];
-    let buffer = "";
-    let bufferMarks = null;
-    const flush = () => {
-        if (buffer.length === 0)
-            return;
-        const textNode = { type: "text", text: buffer };
-        if (bufferMarks && bufferMarks.length > 0)
-            textNode.marks = bufferMarks;
-        out.push(textNode);
-        buffer = "";
-        bufferMarks = null;
-    };
-    for (const slot of chars) {
-        if (slot.atom) {
-            flush();
-            out.push(slot.atom);
-            continue;
-        }
-        if (bufferMarks !== null && !marksEqual(bufferMarks, slot.marks)) {
-            flush();
-        }
-        if (bufferMarks === null)
-            bufferMarks = slot.marks;
-        buffer += slot.ch;
-    }
-    flush();
-    return out;
-}
-/** Longest common prefix length of two strings. */
-function commonPrefixLen(a, b) {
-    const max = Math.min(a.length, b.length);
-    let i = 0;
-    while (i < max && a[i] === b[i])
-        i++;
-    return i;
-}
-/** Longest common suffix length of two strings, capped so it can't overlap. */
-function commonSuffixLen(a, b, cap) {
-    const max = Math.min(a.length, b.length, cap);
-    let i = 0;
-    while (i < max && a[a.length - 1 - i] === b[b.length - 1 - i])
-        i++;
-    return i;
-}
-/**
- * Apply one edit to one block's flattened slot array.
- *
- * The caller passes only VALID (atom-free) match positions (see
- * findValidMatches), so no match range can overlap an atom slot here.
- */
-function applyEditToChars(chars, edit, matchPositions) {
-    // Pre-compute the diff slices once (find/replace are constant per edit).
-    const p = commonPrefixLen(edit.find, edit.replace);
-    const s = commonSuffixLen(edit.find, edit.replace, Math.min(edit.find.length, edit.replace.length) - p);
-    const insertText = edit.replace.slice(p, edit.replace.length - s);
-    // Rebuild the slot array in a single left-to-right pass, splicing at each
-    // match start. Offsets into `chars` stay valid because we copy through.
-    const newChars = [];
-    let cursor = 0;
-    let spliced = 0;
-    for (const mStart of matchPositions) {
-        const mEnd = mStart + edit.find.length;
-        const changedStart = mStart + p;
-        const changedEnd = mEnd - s;
-        // Copy through everything up to the changed region (incl. the prefix).
-        for (; cursor < changedStart; cursor++)
-            newChars.push(chars[cursor]);
-        const removed = chars.slice(changedStart, changedEnd);
-        // Choose the marks for the inserted characters.
-        let chosenMarks = [];
-        if (removed.length > 0 &&
-            removed.every((r) => marksEqual(r.marks, removed[0].marks))) {
-            // Uniform removed region: inherit its marks directly.
-            chosenMarks = removed[0].marks;
-        }
-        else {
-            // Empty or non-uniform removed region: inherit from the nearest TEXT
-            // neighbour, skipping atom slots (an atom carries marks that do not
-            // belong on inserted text). Scan left first, then right; fall back to [].
-            let inherited = null;
-            for (let i = changedStart - 1; i >= 0; i--) {
-                if (!chars[i].atom) {
-                    inherited = chars[i].marks;
-                    break;
-                }
-            }
-            if (inherited === null) {
-                for (let i = changedEnd; i < chars.length; i++) {
-                    if (!chars[i].atom) {
-                        inherited = chars[i].marks;
-                        break;
-                    }
-                }
-            }
-            chosenMarks = inherited === null ? [] : inherited;
-        }
-        // Emit the inserted text (one slot per code unit).
-        for (let i = 0; i < insertText.length; i++) {
-            newChars.push({ ch: insertText[i], marks: chosenMarks });
-        }
-        // Skip the removed region.
-        cursor = changedEnd;
-        spliced++;
-    }
-    // Copy through the tail.
-    for (; cursor < chars.length; cursor++)
-        newChars.push(chars[cursor]);
-    return { newChars, spliced };
-}
-/**
- * Apply text edits to a ProseMirror doc (operates on a deep copy, returns it).
- *
- * Returns { doc, results, failed }:
- *  - results: edits that applied (replacements >= 1).
- *  - failed:  edits that matched zero times, were ambiguous (multi-match
- *    without replaceAll), or whose changed region crosses a non-text inline
- *    node. These do NOT throw — they are recorded so the caller can surface an
- *    actionable message and still keep the edits that did apply.
- *
- * Edits apply IN ORDER to the same working copy, so a later edit can target
- * text produced by an earlier one. The input doc is never mutated. The only
- * thrown error is for invalid input (an empty `edit.find`).
- */
-export function applyTextEdits(doc, edits) {
-    const copy = JSON.parse(JSON.stringify(doc));
-    const results = [];
-    const failed = [];
-    for (const edit of edits) {
-        if (!edit.find)
-            throw new Error("edit.find must be a non-empty string");
-        // HARD-REFUSE formatting changes. edit_page_text edits PLAIN TEXT only and
-        // writes the replacement verbatim, so it cannot add/remove marks. We refuse
-        // only a pure formatting TOGGLE: find and replace differ ONLY by balanced
-        // markdown markers (e.g. find:"~~$69~~" / replace:"$69", or find:"M5Stack" /
-        // replace:"**M5Stack**" which would write literal `**`).
-        //
-        // The detector is the STRICT stripBalancedWrappers, NOT the lenient locator
-        // stripInlineMarkdown: the lenient one also trims whitespace/emoji and
-        // collapses lone `*`/`_` runs, which gives false positives on ordinary
-        // plain-text edits (trailing-space trim, snake_case, `2 * 3 * 4`, URLs with
-        // underscores) and wrongly refuses them. Comparing the strict strip of both
-        // sides symmetrically catches every real formatting toggle while leaving
-        // plain text alone; a typo fix wrapped in markdown still applies because its
-        // stripped find != stripped replace.
-        const formattingOnly = edit.find !== edit.replace &&
-            stripBalancedWrappers(edit.find) === stripBalancedWrappers(edit.replace);
-        if (formattingOnly) {
-            failed.push({
-                find: edit.find,
-                reason: "edit_page_text edits plain text only and cannot add or remove formatting marks (bold/italic/strike/code/link); it writes the replacement as LITERAL text. This edit looks like a formatting change (markdown markers in find/replace). To change marks, read the block with get_page_json and use patch_node (or update_page_json) to set the node's marks array.",
-            });
-            continue;
-        }
-        // Gather every inline block in document order (recurse the whole tree so
-        // nested containers — callouts, list items, table cells, blockquotes — are
-        // all covered).
-        const blocks = [];
-        (function collect(node) {
-            if (isInlineBlock(node))
-                blocks.push(node);
-            for (const child of node.content || [])
-                collect(child);
-        })(copy);
-        // Find every VALID (atom-free) occurrence per block. A candidate whose slot
-        // range overlaps a non-text inline atom is never a match (collision-safe vs
-        // the U+FFFC placeholder), so it is excluded from both the uniqueness count
-        // and the splicing.
-        const blockChars = blocks.map((b) => flattenBlock(b));
-        const blockPlain = blockChars.map((chars) => chars.map((c) => c.ch).join(""));
-        // EXACT MATCH WINS: try the verbatim locator first.
-        let effectiveFind = edit.find;
-        let normalized = false;
-        let validPerBlock = blockChars.map((chars, b) => findValidMatches(chars, blockPlain[b], edit.find));
-        let total = 0;
-        for (const positions of validPerBlock)
-            total += positions.length;
-        // FALLBACK: only if the verbatim locator matched nothing, retry with the
-        // markdown-stripped form. `edit.replace` is never touched — this only
-        // changes what we LOCATE, not what we insert.
-        const stripped = stripInlineMarkdown(edit.find);
-        if (total === 0 && stripped !== edit.find && stripped.length > 0) {
-            const strippedPerBlock = blockChars.map((chars, b) => findValidMatches(chars, blockPlain[b], stripped));
-            let strippedTotal = 0;
-            for (const positions of strippedPerBlock)
-                strippedTotal += positions.length;
-            if (strippedTotal >= 1) {
-                validPerBlock = strippedPerBlock;
-                total = strippedTotal;
-                effectiveFind = stripped;
-                normalized = true;
-            }
-        }
-        if (total === 0) {
-            // Distinguish "the text exists but only across an atom" from a plain
-            // not-found: if a raw substring scan (atoms included) WOULD have hit —
-            // for EITHER the verbatim or the stripped locator — the only thing
-            // blocking the edit is the atom, so report that.
-            const existsAcrossAtom = blockPlain.some((plain) => plain.indexOf(edit.find) !== -1 ||
-                (stripped !== edit.find && plain.indexOf(stripped) !== -1));
-            let reason;
-            if (existsAcrossAtom) {
-                reason =
-                    "match crosses a non-text inline node (image/break/mention); use update_page_json for structural changes.";
-            }
-            else {
-                // Append a bounded "closest text" hint: find the FIRST block that
-                // contains the longest whitespace-delimited token (>= 3 chars) of the
-                // (stripped, then raw) locator, and quote that block's plain text.
-                reason = "text not found in the document.";
-                const tokenSource = stripped.length > 0 ? stripped : edit.find;
-                const longestToken = tokenSource
-                    .split(/\s+/)
-                    .filter((t) => t.length >= 3)
-                    .sort((a, b) => b.length - a.length)[0];
-                if (longestToken) {
-                    const hitBlock = blockPlain.find((plain) => plain.includes(longestToken));
-                    if (hitBlock) {
-                        // Truncate by code point (spread iterates by code point) so a
-                        // surrogate pair is never split; append the ellipsis only when the
-                        // text was actually longer than the limit.
-                        const points = [...hitBlock];
-                        const snippet = points.length > 120
-                            ? points.slice(0, 120).join("") + "…"
-                            : hitBlock;
-                        reason += ` Closest block text: "${snippet}".`;
-                    }
-                }
-            }
-            failed.push({ find: edit.find, reason });
-            continue;
-        }
-        if (total > 1 && !edit.replaceAll) {
-            failed.push({
-                find: edit.find,
-                reason: `matches ${total} times. Provide a longer, unique fragment or set replaceAll: true.`,
-            });
-            continue;
-        }
-        // Plan the splices from the valid positions. For a non-replaceAll edit we
-        // splice only the first valid match (left-to-right across blocks); for
-        // replaceAll we splice every valid match.
-        const plannedPerBlock = blockChars.map(() => []);
-        let takenFirst = false;
-        for (let b = 0; b < validPerBlock.length; b++) {
-            for (const idx of validPerBlock[b]) {
-                if (edit.replaceAll) {
-                    plannedPerBlock[b].push(idx);
-                }
-                else if (!takenFirst) {
-                    plannedPerBlock[b].push(idx);
-                    takenFirst = true;
-                    break;
-                }
-                else {
-                    break;
-                }
-            }
-            if (!edit.replaceAll && takenFirst)
-                break;
-        }
-        // Apply the splices block-by-block and re-tokenize changed blocks. The
-        // local edit uses `effectiveFind` (verbatim or normalized) so the
-        // prefix/suffix diff is computed against the ACTUALLY matched text, while
-        // `edit.replace` stays literal — never stripped.
-        const effectiveEdit = {
-            find: effectiveFind,
-            replace: edit.replace,
-            replaceAll: edit.replaceAll,
-        };
-        let spliced = 0;
-        for (let b = 0; b < blocks.length; b++) {
-            if (plannedPerBlock[b].length === 0)
-                continue;
-            const { newChars, spliced: n } = applyEditToChars(blockChars[b], effectiveEdit, plannedPerBlock[b]);
-            spliced += n;
-            blocks[b].content = tokenizeChars(newChars);
-        }
-        // Keep `find: edit.find` (the original) so the caller can correlate.
-        const result = { find: edit.find, replacements: spliced };
-        if (normalized)
-            result.normalized = true;
-        results.push(result);
-    }
-    // Safety net: drop any empty text nodes (ProseMirror forbids them). The
-    // re-tokenizer never emits empty text nodes, but untouched blocks could in
-    // principle carry one in from upstream.
-    (function prune(node) {
-        if (Array.isArray(node.content)) {
-            node.content = node.content.filter((child) => !(child.type === "text" && child.text === ""));
-            for (const child of node.content)
-                prune(child);
-        }
-    })(copy);
-    return { doc: copy, results, failed };
-}
diff --git a/packages/mcp/build/lib/markdown-converter.js b/packages/mcp/build/lib/markdown-converter.js
deleted file mode 100644
index 96536036..00000000
--- a/packages/mcp/build/lib/markdown-converter.js
+++ /dev/null
@@ -1,835 +0,0 @@
-/**
- * Convert ProseMirror/TipTap JSON content to Markdown
- * Supports all Docmost-specific node types and extensions
- */
-export function convertProseMirrorToMarkdown(content) {
-    if (!content || !content.content)
-        return "";
-    // Escape a value interpolated into an HTML double-quoted attribute value
-    // (textAlign, colors, image src, math `text`, all data-* attrs, etc.). In the
-    // ATTRIBUTE context only the quote that delimits the value and the ampersand
-    // that starts an entity are special, so we escape ONLY & " (and ' for safety
-    // when single-quoted delimiters are used). We deliberately do NOT escape < or
-    // >: the HTML re-parser (parse5/jsdom via @tiptap/html) does NOT decode
-    // &lt;/&gt; back inside attribute values, so escaping them would corrupt the
-    // stored data (e.g. a math node's LaTeX `a < b`) and ACCUMULATE escapes on
-    // every round-trip (`a < b` -> `a &lt; b` -> `a &amp;lt; b`). Escaping & "
-    // keeps the value inert against attribute-injection while staying idempotent.
-    // NOTE: escape ONLY & and " here. The value is always wrapped in double
-    // quotes, so " is the only delimiter; ' is NOT special in a double-quoted
-    // value, and parse5 does not decode &#39; back inside attribute values, so
-    // escaping ' would (like < >) corrupt the value and accumulate &amp; on every
-    // round-trip. Escaping & and " is idempotent (parse5 decodes them back).
-    const escapeAttr = (value) => String(value)
-        .replace(/&/g, "&amp;")
-        .replace(/"/g, "&quot;");
-    // Escape a value placed as HTML element TEXT content (between tags), where
-    // <, >, and & are all significant. Used for text rendered inside raw-HTML
-    // blocks (table cells / columns) so stored characters cannot inject markup.
-    const escapeHtmlText = (value) => String(value)
-        .replace(/&/g, "&amp;")
-        .replace(/</g, "&lt;")
-        .replace(/>/g, "&gt;");
-    // Percent-encode characters that would break out of a markdown URL target
-    // (...) — whitespace/newlines and parentheses — so a stored src stays a
-    // single inert token (used for image/video/youtube srcs).
-    const encodeMdUrl = (value) => String(value || "")
-        .replace(/\s/g, (c) => (c === " " ? "%20" : encodeURIComponent(c)))
-        .replace(/\(/g, "%28")
-        .replace(/\)/g, "%29");
-    const processNode = (node) => {
-        const type = node.type;
-        const nodeContent = node.content || [];
-        switch (type) {
-            case "doc":
-                return nodeContent.map(processNode).join("\n\n");
-            case "paragraph":
-                const text = nodeContent.map(processNode).join("");
-                const align = node.attrs?.textAlign;
-                if (align && align !== "left") {
-                    return `<div align="${escapeAttr(align)}">${text}</div>`;
-                }
-                return text || "";
-            case "heading":
-                const level = node.attrs?.level || 1;
-                const headingText = nodeContent.map(processNode).join("");
-                return "#".repeat(level) + " " + headingText;
-            case "text":
-                let textContent = node.text || "";
-                // Apply marks (bold, italic, code, etc.)
-                if (node.marks) {
-                    // Markdown code spans (`...`) cannot carry inner formatting, so when a
-                    // run has the `code` mark alongside ANY other mark, backtick syntax
-                    // would leak literal ** / []() into the code text. In that case emit
-                    // nested HTML (<code> innermost, the other marks wrapping it as HTML)
-                    // so the output is at least well-formed and re-parseable.
-                    //
-                    // NOTE: this does NOT round-trip both marks. The schema's `code` mark
-                    // has `excludes: "_"` (it excludes every other mark), so on import the
-                    // co-occurring mark is always dropped — the run comes back as `code`
-                    // only. We keep the emission simple and accept that the other mark is
-                    // lost; preserving both is impossible while `code` excludes them.
-                    // Only use the backtick form when `code` is the sole mark.
-                    const markTypes = node.marks.map((m) => m.type);
-                    const hasCode = markTypes.includes("code");
-                    const codeCombined = hasCode && markTypes.length > 1;
-                    for (const mark of node.marks) {
-                        switch (mark.type) {
-                            case "bold":
-                                textContent = codeCombined
-                                    ? `<strong>${textContent}</strong>`
-                                    : `**${textContent}**`;
-                                break;
-                            case "italic":
-                                textContent = codeCombined
-                                    ? `<em>${textContent}</em>`
-                                    : `*${textContent}*`;
-                                break;
-                            case "code":
-                                // When combined with another mark, wrap as <code> so the
-                                // surrounding HTML marks can nest around it; otherwise use the
-                                // plain backtick span.
-                                textContent = codeCombined
-                                    ? `<code>${textContent}</code>`
-                                    : `\`${textContent}\``;
-                                break;
-                            case "link": {
-                                const href = mark.attrs?.href || "";
-                                const title = mark.attrs?.title;
-                                if (codeCombined) {
-                                    // Emit an HTML anchor so it can wrap the nested <code>.
-                                    const safeHref = escapeAttr(href);
-                                    if (title) {
-                                        textContent = `<a href="${safeHref}" title="${escapeAttr(String(title))}">${textContent}</a>`;
-                                    }
-                                    else {
-                                        textContent = `<a href="${safeHref}">${textContent}</a>`;
-                                    }
-                                }
-                                else if (title) {
-                                    // Emit the optional markdown link title; escape an embedded
-                                    // double-quote so it cannot terminate the title string early.
-                                    const safeTitle = String(title).replace(/"/g, '\\"');
-                                    textContent = `[${textContent}](${href} "${safeTitle}")`;
-                                }
-                                else {
-                                    textContent = `[${textContent}](${href})`;
-                                }
-                                break;
-                            }
-                            case "strike":
-                                textContent = codeCombined
-                                    ? `<s>${textContent}</s>`
-                                    : `~~${textContent}~~`;
-                                break;
-                            case "underline":
-                                textContent = `<u>${textContent}</u>`;
-                                break;
-                            case "subscript":
-                                textContent = `<sub>${textContent}</sub>`;
-                                break;
-                            case "superscript":
-                                textContent = `<sup>${textContent}</sup>`;
-                                break;
-                            case "highlight": {
-                                // Preserve a null/empty color as a plain highlight (a bare
-                                // <mark> with no background-color); only emit the style when a
-                                // color is actually set, so a plain highlight is not forced to
-                                // yellow on export.
-                                const color = mark.attrs?.color;
-                                textContent = color
-                                    ? `<mark style="background-color: ${escapeAttr(color)}">${textContent}</mark>`
-                                    : `<mark>${textContent}</mark>`;
-                                break;
-                            }
-                            case "textStyle":
-                                if (mark.attrs?.color) {
-                                    textContent = `<span style="color: ${escapeAttr(mark.attrs.color)}">${textContent}</span>`;
-                                }
-                                break;
-                            case "comment": {
-                                // Emit the inline comment anchor so highlights round-trip. The
-                                // schema's Comment mark parses span[data-comment-id] (attrs
-                                // commentId/resolved).
-                                const cid = mark.attrs?.commentId;
-                                if (cid) {
-                                    const resolvedAttr = mark.attrs?.resolved
-                                        ? ` data-resolved="true"`
-                                        : "";
-                                    textContent = `<span data-comment-id="${escapeAttr(cid)}"${resolvedAttr}>${textContent}</span>`;
-                                }
-                                break;
-                            }
-                            case "spoiler":
-                                // Markdown has no native spoiler syntax, so emit the same
-                                // lossless raw HTML the editor-ext turndown rule produces; the
-                                // schema's Spoiler mark parses span[data-spoiler] back on import.
-                                textContent = `<span data-spoiler="true">${textContent}</span>`;
-                                break;
-                        }
-                    }
-                }
-                return textContent;
-            case "codeBlock":
-                const language = node.attrs?.language || "";
-                // Strip ALL trailing newlines so the export is idempotent: marked
-                // re-adds exactly one trailing "\n" on import, so trimming only one
-                // here would let the text grow by "\n" on each round-trip. Removing
-                // every trailing newline makes repeated cycles stable.
-                const code = nodeContent
-                    .map(processNode)
-                    .join("")
-                    .replace(/\n+$/, "");
-                return "```" + language + "\n" + code + "\n```";
-            case "bulletList":
-                return nodeContent
-                    .map((item) => processListItem(item, "-"))
-                    .join("\n");
-            case "orderedList":
-                return nodeContent
-                    .map((item, index) => processListItem(item, `${index + 1}.`))
-                    .join("\n");
-            case "taskList":
-                return nodeContent.map((item) => processTaskItem(item)).join("\n");
-            case "taskItem":
-                // Delegate to the same helper used by taskList so multi-block and
-                // nested task items render and indent consistently.
-                return processTaskItem(node);
-            case "listItem":
-                return nodeContent.map(processNode).join("\n");
-            case "blockquote":
-                // Prefix EVERY line of EVERY child with "> " and separate block-level
-                // children with a blank ">" line so code blocks / multi-paragraph
-                // quotes round-trip correctly.
-                return nodeContent
-                    .map((n) => processNode(n)
-                    .split("\n")
-                    .map((line) => (line.length ? `> ${line}` : ">"))
-                    .join("\n"))
-                    .join("\n>\n");
-            case "horizontalRule":
-                return "---";
-            case "hardBreak":
-                // Two trailing spaces before the newline encode a markdown hard break;
-                // a bare "\n" would be reimported as a soft break and lost.
-                return "  \n";
-            case "image": {
-                const imgAlt = node.attrs?.alt || "";
-                const imgCaption = node.attrs?.caption || "";
-                if (imgCaption) {
-                    // ![]() can't carry a caption, so (symmetric to video) emit a raw
-                    // <img> wrapped in a block <div>. On import marked.parse keeps the raw
-                    // HTML and generateJSON runs the image extension's parseHTML, which
-                    // restores the caption from data-caption.
-                    const parts = [`src="${escapeAttr(node.attrs?.src ?? "")}"`];
-                    if (imgAlt)
-                        parts.push(`alt="${escapeAttr(imgAlt)}"`);
-                    parts.push(`data-caption="${escapeAttr(imgCaption)}"`);
-                    return `<div><img ${parts.join(" ")}></div>`;
-                }
-                // Neutralize characters that could break out of the markdown image
-                // URL: spaces/newlines and parentheses would terminate the (...) target
-                // and let a stored src inject following markdown/HTML. Percent-encode
-                // them so the URL stays a single inert token.
-                const imgSrc = encodeMdUrl(node.attrs?.src);
-                return `![${imgAlt}](${imgSrc})`;
-            }
-            case "video": {
-                // Emit the schema-matching <video> element so generateJSON rebuilds the
-                // node with its attrs intact. The schema's parseHTML reads src/aria-label
-                // from the standard attributes and the remaining attrs from data-*.
-                const attrs = node.attrs || {};
-                const parts = [`src="${escapeAttr(attrs.src ?? "")}"`];
-                if (attrs.alt)
-                    parts.push(`aria-label="${escapeAttr(attrs.alt)}"`);
-                if (attrs.attachmentId)
-                    parts.push(`data-attachment-id="${escapeAttr(attrs.attachmentId)}"`);
-                if (attrs.width != null)
-                    parts.push(`width="${escapeAttr(attrs.width)}"`);
-                if (attrs.height != null)
-                    parts.push(`height="${escapeAttr(attrs.height)}"`);
-                if (attrs.size != null)
-                    parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-                if (attrs.align)
-                    parts.push(`data-align="${escapeAttr(attrs.align)}"`);
-                if (attrs.aspectRatio != null)
-                    parts.push(`data-aspect-ratio="${escapeAttr(attrs.aspectRatio)}"`);
-                // Wrap in a block <div> so marked treats it as a block (a bare <video>
-                // is inline-level HTML and marked wraps it in <p>, leaving a spurious
-                // empty paragraph beside the hoisted block atom). The wrapper has no
-                // data-type, so the schema parser ignores it and just hoists the video.
-                return `<div><video ${parts.join(" ")}></video></div>`;
-            }
-            case "youtube": {
-                // Emit the schema-matching div[data-type="youtube"]; the schema reads
-                // src from data-src and width/height/align from data-* attributes.
-                const attrs = node.attrs || {};
-                const parts = [
-                    `data-type="youtube"`,
-                    `data-src="${escapeAttr(attrs.src ?? "")}"`,
-                ];
-                if (attrs.width != null)
-                    parts.push(`data-width="${escapeAttr(attrs.width)}"`);
-                if (attrs.height != null)
-                    parts.push(`data-height="${escapeAttr(attrs.height)}"`);
-                if (attrs.align)
-                    parts.push(`data-align="${escapeAttr(attrs.align)}"`);
-                return `<div ${parts.join(" ")}></div>`;
-            }
-            case "table": {
-                // A GFM pipe table cannot represent merged cells. If ANY cell carries
-                // colspan>1 or rowspan>1, a pipe table would corrupt the grid on
-                // re-import, so emit the WHOLE table as raw HTML <table> instead: the
-                // schema's table family parseHTML (tag table/tr/td/th, with colspan/
-                // rowspan read from the same-named HTML attrs and align via parseHTML)
-                // round-trips it faithfully. Otherwise keep the lighter GFM pipe table.
-                const tableRows = nodeContent;
-                if (tableRows.length === 0)
-                    return "";
-                const hasSpan = tableRows.some((row) => (row.content || []).some((cell) => (cell.attrs?.colspan ?? 1) > 1 || (cell.attrs?.rowspan ?? 1) > 1));
-                if (hasSpan) {
-                    // Render each cell's block children to HTML (marked does NOT parse
-                    // markdown inside a raw HTML block, so emitting markdown here would
-                    // leak literal ** / `` into the cell). blockToHtml mirrors the schema
-                    // HTML so inner formatting re-parses into the right marks/nodes.
-                    const renderHtmlCell = (cell) => {
-                        const tag = cell.type === "tableHeader" ? "th" : "td";
-                        const a = cell.attrs || {};
-                        const cellParts = [];
-                        if ((a.colspan ?? 1) > 1)
-                            cellParts.push(`colspan="${escapeAttr(a.colspan)}"`);
-                        if ((a.rowspan ?? 1) > 1)
-                            cellParts.push(`rowspan="${escapeAttr(a.rowspan)}"`);
-                        if (a.align)
-                            cellParts.push(`align="${escapeAttr(a.align)}"`);
-                        const open = cellParts.length
-                            ? `<${tag} ${cellParts.join(" ")}>`
-                            : `<${tag}>`;
-                        const inner = (cell.content || [])
-                            .map((block) => blockToHtml(block))
-                            .join("");
-                        return `${open}${inner}</${tag}>`;
-                    };
-                    const htmlRows = tableRows
-                        .map((row) => `<tr>${(row.content || []).map(renderHtmlCell).join("")}</tr>`)
-                        .join("");
-                    return `<table><tbody>${htmlRows}</tbody></table>`;
-                }
-                // No merged cells: emit a GFM table (header row + separator) so the
-                // markdown can be parsed back into a table on re-import.
-                const rows = tableRows.map(processNode);
-                const headerCells = tableRows[0]?.content || [];
-                const columns = headerCells.length || 1;
-                // Derive alignment markers (:--, :-:, --:) from each header cell.
-                const markers = Array.from({ length: columns }, (_, i) => {
-                    const align = headerCells[i]?.attrs?.align;
-                    switch (align) {
-                        case "left":
-                            return ":--";
-                        case "center":
-                            return ":-:";
-                        case "right":
-                            return "--:";
-                        default:
-                            return "---";
-                    }
-                });
-                const separator = "| " + markers.join(" | ") + " |";
-                return [rows[0], separator, ...rows.slice(1)].join("\n");
-            }
-            case "tableRow":
-                return "| " + nodeContent.map(processNode).join(" | ") + " |";
-            case "tableCell":
-            case "tableHeader": {
-                // Join multiple block children with a space (not "") so adjacent blocks
-                // like a paragraph followed by a list don't collide into "line1- a".
-                // Then collapse newlines and escape pipes so a cell containing "|" or a
-                // line break cannot corrupt the surrounding GFM row.
-                return nodeContent
-                    .map(processNode)
-                    .join(" ")
-                    .replace(/\r?\n/g, " ")
-                    .replace(/\|/g, "\\|");
-            }
-            case "callout":
-                const calloutType = node.attrs?.type || "info";
-                const calloutContent = nodeContent.map(processNode).join("\n");
-                return `:::${calloutType.toLowerCase()}\n${calloutContent}\n:::`;
-            case "details":
-                return nodeContent.map(processNode).join("\n");
-            case "detailsSummary":
-                const summaryText = nodeContent.map(processNode).join("");
-                return `<details>\n<summary>${summaryText}</summary>\n`;
-            case "detailsContent":
-                const detailsText = nodeContent.map(processNode).join("\n");
-                return `${detailsText}\n</details>`;
-            case "mathInline": {
-                // The schema's `text` attribute has no parseHTML, so TipTap's default
-                // parser reads it from the `text` HTML attribute (NOT the element's text
-                // content). Emit span[data-type="mathInline"] carrying the LaTeX in a
-                // `text="..."` attribute so it round-trips. marked cannot parse $...$
-                // back, so the previous form was lossy.
-                const inlineMath = node.attrs?.text || "";
-                return `<span data-type="mathInline" data-katex="true" text="${escapeAttr(inlineMath)}"></span>`;
-            }
-            case "mathBlock": {
-                // Same as mathInline: the LaTeX must ride in the `text` HTML attribute
-                // for the schema's default parser to recover it.
-                const blockMath = node.attrs?.text || "";
-                return `<div data-type="mathBlock" data-katex="true" text="${escapeAttr(blockMath)}"></div>`;
-            }
-            case "mention": {
-                // Emit span[data-type="mention"] with the schema's data-* attributes so
-                // generateJSON rebuilds the mention node instead of leaving "@label"
-                // plain text that cannot re-parse.
-                const attrs = node.attrs || {};
-                const parts = [`data-type="mention"`];
-                if (attrs.id)
-                    parts.push(`data-id="${escapeAttr(attrs.id)}"`);
-                if (attrs.label)
-                    parts.push(`data-label="${escapeAttr(attrs.label)}"`);
-                if (attrs.entityType)
-                    parts.push(`data-entity-type="${escapeAttr(attrs.entityType)}"`);
-                if (attrs.entityId)
-                    parts.push(`data-entity-id="${escapeAttr(attrs.entityId)}"`);
-                if (attrs.slugId)
-                    parts.push(`data-slug-id="${escapeAttr(attrs.slugId)}"`);
-                if (attrs.creatorId)
-                    parts.push(`data-creator-id="${escapeAttr(attrs.creatorId)}"`);
-                if (attrs.anchorId)
-                    parts.push(`data-anchor-id="${escapeAttr(attrs.anchorId)}"`);
-                // Keep the label as visible text content too; the schema reads attrs
-                // from data-*, so the inner text is purely cosmetic and harmless.
-                const mentionLabel = attrs.label || attrs.id || "";
-                // The label is visible element TEXT content here (the data-* attrs above
-                // carry the real values), so escape it for the text context, not attrs.
-                return `<span ${parts.join(" ")}>@${escapeHtmlText(mentionLabel)}</span>`;
-            }
-            case "footnoteReference": {
-                // Pandoc/GFM inline marker. The number is derived (not stored), so the
-                // id is the stable anchor.
-                const fnId = node.attrs?.id || "";
-                return fnId ? `[^${fnId}]` : "";
-            }
-            case "footnotesList":
-                // The container renders its definitions, each on its own `[^id]: ...`
-                // line. A blank line separates the body from the notes block.
-                return nodeContent.map(processNode).join("\n");
-            case "footnoteDefinition": {
-                const defId = node.attrs?.id || "";
-                // Collapse the definition's paragraphs into a single line; multi-line
-                // footnotes are a v2 refinement.
-                const defText = nodeContent
-                    .map(processNode)
-                    .join(" ")
-                    .replace(/\s*\n+\s*/g, " ")
-                    .trim();
-                return defId ? `[^${defId}]: ${defText}` : "";
-            }
-            case "attachment": {
-                // BUG FIX: the old code read node.attrs.fileName / node.attrs.src, but
-                // the schema stores name/url (plus mime/size/attachmentId). Emit the
-                // schema-matching div[data-type="attachment"] with data-attachment-*
-                // attrs so the node round-trips instead of degrading to a markdown link.
-                const attrs = node.attrs || {};
-                const parts = [
-                    `data-type="attachment"`,
-                    `data-attachment-url="${escapeAttr(attrs.url ?? "")}"`,
-                ];
-                if (attrs.name)
-                    parts.push(`data-attachment-name="${escapeAttr(attrs.name)}"`);
-                if (attrs.mime)
-                    parts.push(`data-attachment-mime="${escapeAttr(attrs.mime)}"`);
-                if (attrs.size != null)
-                    parts.push(`data-attachment-size="${escapeAttr(attrs.size)}"`);
-                if (attrs.attachmentId)
-                    parts.push(`data-attachment-id="${escapeAttr(attrs.attachmentId)}"`);
-                return `<div ${parts.join(" ")}></div>`;
-            }
-            case "drawio":
-            case "excalidraw": {
-                // Emit the schema-matching div[data-type=...] carrying the diagram's
-                // attrs as data-* (the schema's diagramAttributes reads src/title/alt/
-                // width/height/size/aspectRatio/align/attachmentId from data-*), so the
-                // diagram round-trips instead of degrading to a lossy placeholder.
-                const attrs = node.attrs || {};
-                const parts = [
-                    `data-type="${type}"`,
-                    `data-src="${escapeAttr(attrs.src ?? "")}"`,
-                ];
-                if (attrs.title != null)
-                    parts.push(`data-title="${escapeAttr(attrs.title)}"`);
-                if (attrs.alt != null)
-                    parts.push(`data-alt="${escapeAttr(attrs.alt)}"`);
-                if (attrs.width != null)
-                    parts.push(`data-width="${escapeAttr(attrs.width)}"`);
-                if (attrs.height != null)
-                    parts.push(`data-height="${escapeAttr(attrs.height)}"`);
-                if (attrs.size != null)
-                    parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-                if (attrs.aspectRatio != null)
-                    parts.push(`data-aspect-ratio="${escapeAttr(attrs.aspectRatio)}"`);
-                if (attrs.align)
-                    parts.push(`data-align="${escapeAttr(attrs.align)}"`);
-                if (attrs.attachmentId)
-                    parts.push(`data-attachment-id="${escapeAttr(attrs.attachmentId)}"`);
-                return `<div ${parts.join(" ")}></div>`;
-            }
-            case "embed": {
-                // Emit the schema-matching div[data-type="embed"]; the schema reads
-                // src/provider/align/width/height from data-* attributes so the node
-                // (and its provider iframe info) survives the round-trip.
-                const attrs = node.attrs || {};
-                const parts = [
-                    `data-type="embed"`,
-                    `data-src="${escapeAttr(attrs.src ?? "")}"`,
-                    `data-provider="${escapeAttr(attrs.provider ?? "")}"`,
-                ];
-                if (attrs.align)
-                    parts.push(`data-align="${escapeAttr(attrs.align)}"`);
-                if (attrs.width != null)
-                    parts.push(`data-width="${escapeAttr(attrs.width)}"`);
-                if (attrs.height != null)
-                    parts.push(`data-height="${escapeAttr(attrs.height)}"`);
-                return `<div ${parts.join(" ")}></div>`;
-            }
-            case "audio": {
-                // Emit the schema-matching <audio> element (was emitting nothing). The
-                // schema reads src from src and attachmentId/size from data-*.
-                const attrs = node.attrs || {};
-                const parts = [`src="${escapeAttr(attrs.src ?? "")}"`];
-                if (attrs.attachmentId)
-                    parts.push(`data-attachment-id="${escapeAttr(attrs.attachmentId)}"`);
-                if (attrs.size != null)
-                    parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-                // Wrap in a block <div> for the same reason as video: a bare <audio> is
-                // inline-level HTML that marked would wrap in <p>.
-                return `<div><audio ${parts.join(" ")}></audio></div>`;
-            }
-            case "pdf": {
-                // Emit the schema-matching div[data-type="pdf"] (was emitting nothing).
-                // The schema reads src/width/height from standard attrs and name/
-                // attachmentId/size from data-*.
-                const attrs = node.attrs || {};
-                const parts = [
-                    `data-type="pdf"`,
-                    `src="${escapeAttr(attrs.src ?? "")}"`,
-                ];
-                if (attrs.name)
-                    parts.push(`data-name="${escapeAttr(attrs.name)}"`);
-                if (attrs.attachmentId)
-                    parts.push(`data-attachment-id="${escapeAttr(attrs.attachmentId)}"`);
-                if (attrs.size != null)
-                    parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-                if (attrs.width != null)
-                    parts.push(`width="${escapeAttr(attrs.width)}"`);
-                if (attrs.height != null)
-                    parts.push(`height="${escapeAttr(attrs.height)}"`);
-                return `<div ${parts.join(" ")}></div>`;
-            }
-            case "columns": {
-                // Emit the schema-matching div[data-type="columns"] wrapper so the
-                // multi-column layout survives. Without a case the children were
-                // concatenated with no separator and the text merged. The schema reads
-                // layout from data-layout and widthMode from data-width-mode. The whole
-                // block is raw HTML, so render children via blockToHtml (NOT markdown,
-                // which marked would not re-parse inside a raw HTML block).
-                const attrs = node.attrs || {};
-                const parts = [`data-type="columns"`];
-                if (attrs.layout)
-                    parts.push(`data-layout="${escapeAttr(attrs.layout)}"`);
-                if (attrs.widthMode && attrs.widthMode !== "normal")
-                    parts.push(`data-width-mode="${escapeAttr(attrs.widthMode)}"`);
-                const inner = nodeContent.map((n) => blockToHtml(n)).join("");
-                return `<div ${parts.join(" ")}>${inner}</div>`;
-            }
-            case "column": {
-                // Emit the schema-matching div[data-type="column"]; the schema reads the
-                // column width from data-width. Children are rendered as HTML so their
-                // formatting survives inside this raw HTML block.
-                const attrs = node.attrs || {};
-                const parts = [`data-type="column"`];
-                if (attrs.width)
-                    parts.push(`data-width="${escapeAttr(attrs.width)}"`);
-                const inner = nodeContent.map((n) => blockToHtml(n)).join("");
-                return `<div ${parts.join(" ")}>${inner}</div>`;
-            }
-            case "subpages":
-                return "{{SUBPAGES}}";
-            default:
-                // Fallback: process children
-                return nodeContent.map(processNode).join("");
-        }
-    };
-    // Render inline content (text runs + their marks) to HTML. Used by the raw
-    // HTML fallbacks (spanned tables, columns) where marked will NOT re-parse
-    // markdown, so backtick/asterisk/bracket syntax would otherwise leak as
-    // literal characters. Each mark is mirrored to the HTML the schema's parseHTML
-    // accepts so it re-imports as the matching ProseMirror mark.
-    const inlineToHtml = (inlineNodes) => (inlineNodes || [])
-        .map((n) => {
-        if (n.type === "hardBreak")
-            return "<br>";
-        if (n.type !== "text") {
-            // Inline atoms (mention, mathInline) already emit schema HTML.
-            return processNode(n);
-        }
-        let t = escapeHtmlText(n.text || "");
-        for (const mark of n.marks || []) {
-            switch (mark.type) {
-                case "bold":
-                    t = `<strong>${t}</strong>`;
-                    break;
-                case "italic":
-                    t = `<em>${t}</em>`;
-                    break;
-                case "code":
-                    t = `<code>${t}</code>`;
-                    break;
-                case "strike":
-                    t = `<s>${t}</s>`;
-                    break;
-                case "underline":
-                    t = `<u>${t}</u>`;
-                    break;
-                case "subscript":
-                    t = `<sub>${t}</sub>`;
-                    break;
-                case "superscript":
-                    t = `<sup>${t}</sup>`;
-                    break;
-                case "link":
-                    t = `<a href="${escapeAttr(mark.attrs?.href || "")}">${t}</a>`;
-                    break;
-                case "highlight":
-                    t = mark.attrs?.color
-                        ? `<mark style="background-color: ${escapeAttr(mark.attrs.color)}">${t}</mark>`
-                        : `<mark>${t}</mark>`;
-                    break;
-                case "textStyle":
-                    if (mark.attrs?.color)
-                        t = `<span style="color: ${escapeAttr(mark.attrs.color)}">${t}</span>`;
-                    break;
-                case "comment":
-                    // Inline comment anchor inside a raw-HTML container (columns /
-                    // spanned table cells), so commented text there also round-trips.
-                    if (mark.attrs?.commentId) {
-                        const r = mark.attrs?.resolved ? ` data-resolved="true"` : "";
-                        t = `<span data-comment-id="${escapeAttr(mark.attrs.commentId)}"${r}>${t}</span>`;
-                    }
-                    break;
-            }
-        }
-        return t;
-    })
-        .join("");
-    // Emit the schema-matching <img> for an image node. Shared so the image is
-    // emitted as real HTML wherever a raw-HTML container needs it (inside a column
-    // or a spanned table cell), where markdown `![](...)` would NOT be re-parsed
-    // and would survive as literal text. The Image extension reads src/alt from
-    // the standard attributes; the Docmost extra attrs (width/height/align/size/
-    // attachmentId/aspectRatio) are global attributes read from same-named DOM
-    // attributes, so emit them by name.
-    const imageToHtml = (node) => {
-        const attrs = node.attrs || {};
-        const parts = [`src="${escapeAttr(attrs.src ?? "")}"`];
-        if (attrs.alt)
-            parts.push(`alt="${escapeAttr(attrs.alt)}"`);
-        if (attrs.caption)
-            parts.push(`data-caption="${escapeAttr(attrs.caption)}"`);
-        if (attrs.title)
-            parts.push(`title="${escapeAttr(attrs.title)}"`);
-        if (attrs.width != null)
-            parts.push(`width="${escapeAttr(attrs.width)}"`);
-        if (attrs.height != null)
-            parts.push(`height="${escapeAttr(attrs.height)}"`);
-        if (attrs.align)
-            parts.push(`align="${escapeAttr(attrs.align)}"`);
-        if (attrs.size != null)
-            parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-        if (attrs.attachmentId)
-            parts.push(`data-attachment-id="${escapeAttr(attrs.attachmentId)}"`);
-        if (attrs.aspectRatio != null)
-            parts.push(`data-aspect-ratio="${escapeAttr(attrs.aspectRatio)}"`);
-        return `<img ${parts.join(" ")}>`;
-    };
-    // Emit the schema-matching div[data-type="callout"] for a callout node. The
-    // schema reads the banner type from data-callout-type. Children are rendered
-    // as HTML so they survive inside a raw-HTML container.
-    const calloutToHtml = (node) => {
-        const type = (node.attrs?.type || "info").toLowerCase();
-        const inner = (node.content || []).map(blockToHtml).join("");
-        return `<div data-type="callout" data-callout-type="${escapeAttr(type)}">${inner}</div>`;
-    };
-    // Emit a schema-matching <details> tree. The schema parses <details>,
-    // summary[data-type="detailsSummary"], and div[data-type="detailsContent"].
-    const detailsToHtml = (node) => {
-        const inner = (node.content || []).map(blockToHtml).join("");
-        return `<details>${inner}</details>`;
-    };
-    const detailsSummaryToHtml = (node) => `<summary data-type="detailsSummary">${inlineToHtml(node.content || [])}</summary>`;
-    const detailsContentToHtml = (node) => {
-        const inner = (node.content || []).map(blockToHtml).join("");
-        return `<div data-type="detailsContent">${inner}</div>`;
-    };
-    // Emit the schema-matching taskList/taskItem HTML. bridgeTaskLists (in
-    // collaboration.ts) recognizes ul[data-type="taskList"] with
-    // li[data-type="taskItem"][data-checked]; emitting that directly here keeps
-    // task lists inside columns/cells from degrading to literal "- [ ]" text.
-    const taskListToHtml = (node) => {
-        const items = (node.content || [])
-            .map((it) => {
-            const checked = it.attrs?.checked ? "true" : "false";
-            return `<li data-type="taskItem" data-checked="${checked}">${blockChildrenToHtml(it)}</li>`;
-        })
-            .join("");
-        return `<ul data-type="taskList">${items}</ul>`;
-    };
-    // Render a block node to HTML for the raw-HTML containers (spanned tables,
-    // columns). marked does NOT re-parse markdown inside a raw-HTML block, so
-    // EVERY block type that can appear inside a column or a spanned cell must be
-    // emitted as schema-matching HTML here — never as markdown, or it would land
-    // as literal text on re-import. Nodes whose processNode case already produces
-    // schema-matching HTML (math/media/embed/attachment/nested columns/spanned
-    // table) are delegated to processNode; the markdown-emitting cases
-    // (image/blockquote/callout/details/hr/taskList) get explicit HTML here.
-    const blockToHtml = (block) => {
-        const children = block.content || [];
-        switch (block.type) {
-            case "paragraph":
-                return `<p>${inlineToHtml(children)}</p>`;
-            case "heading": {
-                const level = block.attrs?.level || 1;
-                return `<h${level}>${inlineToHtml(children)}</h${level}>`;
-            }
-            case "bulletList":
-                return `<ul>${children
-                    .map((li) => `<li>${blockChildrenToHtml(li)}</li>`)
-                    .join("")}</ul>`;
-            case "orderedList":
-                return `<ol>${children
-                    .map((li) => `<li>${blockChildrenToHtml(li)}</li>`)
-                    .join("")}</ol>`;
-            case "codeBlock": {
-                const lang = block.attrs?.language || "";
-                // The code itself is element TEXT content (between <code> tags), so it
-                // must escape < > & — NOT the attribute escaper. The language rides in
-                // a class ATTRIBUTE, so it uses escapeAttr.
-                const code = escapeHtmlText(children
-                    .map(processNode)
-                    .join("")
-                    .replace(/\n+$/, ""));
-                const cls = lang ? ` class="language-${escapeAttr(lang)}"` : "";
-                return `<pre><code${cls}>${code}</code></pre>`;
-            }
-            case "image":
-                return imageToHtml(block);
-            case "blockquote":
-                return `<blockquote>${children.map(blockToHtml).join("")}</blockquote>`;
-            case "horizontalRule":
-                return "<hr>";
-            case "callout":
-                return calloutToHtml(block);
-            case "details":
-                return detailsToHtml(block);
-            case "detailsSummary":
-                return detailsSummaryToHtml(block);
-            case "detailsContent":
-                return detailsContentToHtml(block);
-            case "taskList":
-                return taskListToHtml(block);
-            case "taskItem":
-                // A bare taskItem (outside a taskList) still needs a wrapping list so
-                // the schema parses it; wrap it in a single-item taskList.
-                return taskListToHtml({ content: [block] });
-            // table (incl. spanned), columns/column, math, media, embed, attachment,
-            // mention, etc. already emit schema-matching HTML from processNode.
-            case "table":
-            case "columns":
-            case "column":
-            case "mathBlock":
-            case "video":
-            case "audio":
-            case "pdf":
-            case "youtube":
-            case "embed":
-            case "attachment":
-            case "drawio":
-            case "excalidraw":
-                return processNode(block);
-            default:
-                // Any still-unhandled block type: NEVER fall back to markdown inside a
-                // raw-HTML block (it would become literal text). Wrap its rendered
-                // children in a <div> so their content is preserved; if it has no block
-                // children, render its inline content instead.
-                if (children.length && children.some((c) => c.type !== "text")) {
-                    return `<div>${children.map(blockToHtml).join("")}</div>`;
-                }
-                return `<div>${inlineToHtml(children)}</div>`;
-        }
-    };
-    // Render the block children of a list item to HTML (a listItem holds block+
-    // content). Mirrors processListItem but for the HTML fallback path.
-    const blockChildrenToHtml = (item) => (item.content || []).map((b) => blockToHtml(b)).join("");
-    // Indent the rendered children of a list item under a marker prefix.
-    // Each child block is a (possibly multi-line) string. The very first physical
-    // line of the first child carries the marker (e.g. "- " or "1. "); EVERY
-    // other line — the remaining lines of the first child AND all lines of every
-    // subsequent child (nested lists, code blocks, extra paragraphs) — is indented
-    // to align under the marker. Without indenting these continuation lines, the
-    // 2nd/3rd line of a nested child collapses to column 0 and escapes the list.
-    //
-    // The continuation indent MUST equal the LIST marker width, which is not the
-    // same as the visible prefix width:
-    //   - bullet "- "          -> 2 columns
-    //   - task   "- [ ] "      -> marker is still "- " (the "[ ] " is content), 2
-    //   - ordered "1. "/"10. " -> 3/4 columns, scaling with the number's digits
-    // CommonMark anchors nested content to the marker column, so an ordered item
-    // indented to only 2 columns would be re-parsed as a sibling/loose content on
-    // re-import. Callers therefore pass the exact indent width to use.
-    const indentItemChildren = (childStrings, prefix, indentWidth) => {
-        const indent = " ".repeat(indentWidth);
-        const lines = [];
-        childStrings.forEach((child, childIndex) => {
-            child.split("\n").forEach((line, lineIndex) => {
-                if (childIndex === 0 && lineIndex === 0) {
-                    // First physical line of the first block gets the marker.
-                    lines.push(`${prefix} ${line}`);
-                }
-                else {
-                    // Indent every continuation line by the marker width; keep blank
-                    // lines blank rather than emitting trailing whitespace.
-                    lines.push(line.length ? `${indent}${line}` : "");
-                }
-            });
-        });
-        return lines.join("\n");
-    };
-    const processListItem = (item, prefix) => {
-        const itemContent = item.content || [];
-        const childStrings = itemContent.map(processNode);
-        if (childStrings.length === 0)
-            return prefix;
-        // The rendered marker is `${prefix} ` (prefix + one space), so its width —
-        // and thus the continuation indent — is prefix.length + 1. This is correct
-        // for both bullet ("-" -> 2) and ordered ("1." -> 3, "10." -> 4) markers,
-        // since for those the visible prefix IS the list marker.
-        return indentItemChildren(childStrings, prefix, prefix.length + 1);
-    };
-    const processTaskItem = (item) => {
-        const checked = item.attrs?.checked || false;
-        const checkbox = checked ? "[x]" : "[ ]";
-        const prefix = `- ${checkbox}`;
-        const itemContent = item.content || [];
-        const childStrings = itemContent.map(processNode);
-        // An empty task item still needs its checkbox marker; without this guard
-        // the indent below produces "" and the "- [ ]"/"- [x]" row disappears.
-        if (childStrings.length === 0)
-            return prefix;
-        // The list marker for a task item is just "- " (2 columns); the "[ ] "/"[x] "
-        // checkbox is item content, NOT part of the marker. So the continuation
-        // indent is a fixed 2 — do NOT derive it from the wider prefix.length.
-        return indentItemChildren(childStrings, prefix, 2);
-    };
-    return processNode(content).trim();
-}
diff --git a/packages/mcp/build/lib/markdown-document.js b/packages/mcp/build/lib/markdown-document.js
deleted file mode 100644
index d21d9686..00000000
--- a/packages/mcp/build/lib/markdown-document.js
+++ /dev/null
@@ -1,104 +0,0 @@
-/**
- * Self-contained Docmost-flavoured Markdown document (custom extensions).
- *
- * A single `.md` file that packages everything needed to losslessly round-trip
- * a page through "download -> edit body -> re-upload":
- *   - a leading `docmost:meta` block: a one-line JSON object with page identity;
- *   - the Markdown body (carrying inline comment anchors and diagrams as HTML);
- *   - a trailing `docmost:comments` block: a one-line JSON array of comment
- *     threads.
- *
- * Both metadata blocks are HTML comments on purpose: `marked`/`generateJSON`
- * drop HTML comments, so even if the WHOLE file were ever fed straight to the
- * importer without first stripping the blocks, the metadata cannot leak into the
- * document. (A fenced ```docmost-comments``` block would WRONGLY become a
- * codeBlock node, so a fenced block is deliberately NOT used.)
- *
- * The delimiter literals may legitimately appear in the BODY too (e.g. a user
- * re-pastes an exported `.md` into a page, or a page documents this very
- * format). To stay robust, parsing treats only the FINAL, document-ending
- * `docmost:comments` block as metadata: it is the last `<!-- docmost:comments`
- * opener whose closing `-->` sits at the very end of the file. Any earlier
- * literal occurrence is left in the body untouched.
- *
- * NOTE on comments: in this version the comment THREAD records are preserved in
- * the file but are NOT pushed back to the server on import — only the inline
- * comment marks (anchors) embedded in the body are restored. Managing comment
- * records stays with the comment tools/UI.
- */
-// Match the leading meta block (allow leading whitespace). Capture group 1 is
-// the JSON text between the markers.
-const META_RE = /^\s*<!--\s*docmost:meta\s*\n([\s\S]*?)\n-->/;
-// Match a `docmost:comments` opener. Used globally to scan for the LAST opener
-// rather than end-anchoring a single regex (which would mis-capture across a
-// literal opener that appears earlier in the body).
-const COMMENTS_OPEN_RE = /<!--[ \t]*docmost:comments[ \t]*\r?\n/g;
-/**
- * Assemble the full self-contained markdown file: meta block, body, and the
- * comments block. The meta block is always emitted; the comments block is always
- * emitted too (with `[]` when there are no comments) so the format stays uniform
- * and parsing stays simple.
- */
-export function serializeDocmostMarkdown(meta, body, comments) {
-    const metaJson = JSON.stringify(meta);
-    const commentsJson = JSON.stringify(Array.isArray(comments) ? comments : []);
-    const trimmedBody = (body ?? "").trim();
-    return (`<!-- docmost:meta\n${metaJson}\n-->\n\n` +
-        `${trimmedBody}\n\n` +
-        `<!-- docmost:comments\n${commentsJson}\n-->\n`);
-}
-/**
- * Split a self-contained file back into its parts. Tolerant: if the meta or
- * comments block is missing (e.g. a hand-written plain-markdown file), the
- * corresponding value is returned as `null` and the whole input is treated as
- * the body. This never throws on a MISSING block; only a `JSON.parse` failure
- * inside a block that IS present is surfaced as a thrown Error with a clear
- * message. Robust to `\r\n` line endings.
- */
-export function parseDocmostMarkdown(full) {
-    // Normalize line endings so the anchored regexes work regardless of CRLF.
-    const normalized = (full ?? "").replace(/\r\n/g, "\n");
-    // Extract the leading meta block (start-anchored — already unambiguous).
-    let meta = null;
-    let metaEnd = 0;
-    const metaMatch = normalized.match(META_RE);
-    if (metaMatch) {
-        try {
-            meta = JSON.parse(metaMatch[1]);
-        }
-        catch (e) {
-            throw new Error(`Invalid docmost:meta JSON block: ${e instanceof Error ? e.message : String(e)}`);
-        }
-        // Body starts right after the matched meta block.
-        metaEnd = (metaMatch.index ?? 0) + metaMatch[0].length;
-    }
-    // Find the LAST `<!-- docmost:comments` opener; the real file-level block is
-    // the final one whose closing `-->` ends the document. Any earlier literal
-    // occurrence inside the body (e.g. a re-pasted export) is left in the body.
-    let lastOpenStart = -1;
-    let lastOpenEnd = -1;
-    let m;
-    COMMENTS_OPEN_RE.lastIndex = 0;
-    while ((m = COMMENTS_OPEN_RE.exec(normalized)) !== null) {
-        lastOpenStart = m.index;
-        lastOpenEnd = m.index + m[0].length;
-    }
-    let comments = null;
-    let bodyEnd = normalized.length;
-    if (lastOpenStart !== -1) {
-        const rest = normalized.slice(lastOpenEnd);
-        const close = rest.match(/\r?\n-->[ \t]*\r?\n?\s*$/); // closer must end the doc
-        if (close) {
-            const jsonText = rest.slice(0, close.index);
-            try {
-                comments = JSON.parse(jsonText);
-            }
-            catch (e) {
-                throw new Error(`Invalid docmost:comments JSON block: ${e instanceof Error ? e.message : String(e)}`);
-            }
-            bodyEnd = lastOpenStart; // strip from the opener to end of document
-        }
-    }
-    const body = normalized.slice(metaEnd, bodyEnd).trim();
-    return { meta, body, comments };
-}
diff --git a/packages/mcp/build/lib/node-ops.js b/packages/mcp/build/lib/node-ops.js
deleted file mode 100644
index 7f8490ca..00000000
--- a/packages/mcp/build/lib/node-ops.js
+++ /dev/null
@@ -1,821 +0,0 @@
-/**
- * Pure, network-free helpers for manipulating a ProseMirror/TipTap document
- * tree by node id.
- *
- * A ProseMirror node here is a plain JSON object of the shape produced by
- * Docmost: `{ type, attrs?, content?, text?, marks? }`. Children live in the
- * `content` array; a node carries a stable id in `attrs.id`. Callouts and
- * table cells hold their children in `content` just like any other block, so a
- * single recursive walk reaches them all.
- *
- * Every exported function operates on a DEEP CLONE of the input document and
- * returns the new document. The input doc and any `newNode`/`node` argument are
- * never mutated. All functions are defensively null-safe: missing/!Array
- * `content`, non-object nodes, and absent `attrs` are tolerated.
- */
-import { stripInlineMarkdown } from "./text-normalize.js";
-/** Deep-clone a JSON-serializable value without mutating the original. */
-function clone(value) {
-    if (typeof structuredClone === "function") {
-        return structuredClone(value);
-    }
-    // Fallback for environments without structuredClone.
-    return JSON.parse(JSON.stringify(value));
-}
-/** True if `value` is a non-null object (and not an array). */
-function isObject(value) {
-    return value != null && typeof value === "object" && !Array.isArray(value);
-}
-/** True if `node` carries the given id in `node.attrs.id`. */
-function matchesId(node, nodeId) {
-    return isObject(node) && isObject(node.attrs) && node.attrs.id === nodeId;
-}
-/**
- * Recursively concatenate all text contained in a node.
- *
- * Text nodes contribute their `text` string; container nodes contribute the
- * joined `blockPlainText` of their `content` children. Returns "" for nullish
- * or non-object inputs.
- */
-export function blockPlainText(node) {
-    if (!isObject(node))
-        return "";
-    let out = "";
-    if (typeof node.text === "string") {
-        out += node.text;
-    }
-    if (Array.isArray(node.content)) {
-        for (const child of node.content) {
-            out += blockPlainText(child);
-        }
-    }
-    return out;
-}
-/** Truncate `text` to at most `n` chars, appending an ellipsis when cut. */
-function truncate(text, n) {
-    return text.length > n ? text.slice(0, n) + "…" : text;
-}
-/**
- * Build a COMPACT outline of the TOP-LEVEL blocks of `doc` (the entries in
- * `doc.content`). Deliberately does NOT recurse into paragraphs, list items, or
- * table cells — compactness is the point; use `getNodeByRef` to drill into a
- * specific block.
- *
- * Each entry carries `{ index, type, id, firstText }`, plus type-specific
- * extras: headings add `level`; tables add `rows`/`cols` and the first row's
- * cell texts as `header`; list blocks (types ending in "List") add `items`.
- * `firstText` is the block's plain text truncated to 100 chars. Null-safe:
- * a missing or non-object doc/content yields `[]`.
- */
-export function buildOutline(doc) {
-    if (!isObject(doc) || !Array.isArray(doc.content))
-        return [];
-    const out = [];
-    for (let i = 0; i < doc.content.length; i++) {
-        const block = doc.content[i];
-        const type = isObject(block) ? block.type : undefined;
-        const entry = {
-            index: i,
-            type,
-            id: isObject(block) && isObject(block.attrs)
-                ? (block.attrs.id ?? null)
-                : null,
-            firstText: truncate(blockPlainText(block), 100),
-        };
-        if (type === "heading") {
-            entry.level = isObject(block.attrs) ? (block.attrs.level ?? null) : null;
-        }
-        else if (type === "table") {
-            const headerRow = block.content?.[0]?.content ?? [];
-            entry.rows = block.content?.length ?? 0;
-            entry.cols = block.content?.[0]?.content?.length ?? 0;
-            entry.header = headerRow.map((cell) => truncate(blockPlainText(cell), 40));
-        }
-        else if (typeof type === "string" && type.endsWith("List")) {
-            entry.items = block.content?.length ?? 0;
-        }
-        out.push(entry);
-    }
-    return out;
-}
-/**
- * Resolve a single node by reference and return `{ node, path, type }`, or
- * `null` when nothing matches.
- *
- * - `ref` of the form `#<n>` (e.g. `#2`) selects the TOP-LEVEL block at index
- *   `n` in `doc.content`. This is the only way to address table/tableRow/
- *   tableCell nodes, which carry no `attrs.id`.
- * - Otherwise `ref` is treated as a block id: the FIRST node anywhere in the
- *   tree with `attrs.id === ref` is returned.
- *
- * `path` is the array of child indices from the doc root down to the node
- * (so a top-level block is `[index]`). The returned `node` is a DEEP CLONE,
- * so callers can mutate it without touching the input doc. Null-safe.
- */
-export function getNodeByRef(doc, ref) {
-    if (!isObject(doc))
-        return null;
-    // "#<n>": index into the top-level content array.
-    const indexMatch = typeof ref === "string" ? ref.match(/^#(\d+)$/) : null;
-    if (indexMatch) {
-        const index = Number(indexMatch[1]);
-        const block = Array.isArray(doc.content) ? doc.content[index] : undefined;
-        if (!isObject(block))
-            return null;
-        return { node: clone(block), path: [index], type: block.type };
-    }
-    // Otherwise: depth-first search for the first node with attrs.id === ref.
-    const search = (node, trail) => {
-        if (!isObject(node))
-            return null;
-        if (Array.isArray(node.content)) {
-            for (let i = 0; i < node.content.length; i++) {
-                const child = node.content[i];
-                const path = [...trail, i];
-                if (matchesId(child, ref)) {
-                    return { node: clone(child), path, type: child.type };
-                }
-                const hit = search(child, path);
-                if (hit != null)
-                    return hit;
-            }
-        }
-        return null;
-    };
-    return search(doc, []);
-}
-/**
- * Replace EVERY node whose `attrs.id === nodeId` with a deep clone of
- * `newNode`, anywhere in the tree (including inside callouts and table cells).
- *
- * Operates on a clone of `doc`; returns `{ doc, replaced }` where `replaced`
- * is the number of nodes substituted. A fresh clone of `newNode` is used for
- * each match so they do not share references.
- */
-export function replaceNodeById(doc, nodeId, newNode) {
-    const out = clone(doc);
-    let replaced = 0;
-    // Walk a content array, replacing direct matches and recursing into the
-    // (possibly new) children of non-matching nodes.
-    const walkContent = (content) => {
-        for (let i = 0; i < content.length; i++) {
-            const child = content[i];
-            if (matchesId(child, nodeId)) {
-                content[i] = clone(newNode);
-                replaced++;
-                // Do not recurse into a freshly substituted node.
-                continue;
-            }
-            if (isObject(child) && Array.isArray(child.content)) {
-                walkContent(child.content);
-            }
-        }
-    };
-    if (isObject(out) && Array.isArray(out.content)) {
-        walkContent(out.content);
-    }
-    return { doc: out, replaced };
-}
-/**
- * Remove EVERY node whose `attrs.id === nodeId` from its parent `content`
- * array, anywhere in the tree (recursive, including callouts and tables).
- *
- * Operates on a clone of `doc`; returns `{ doc, deleted }` where `deleted` is
- * the number of nodes removed.
- */
-export function deleteNodeById(doc, nodeId) {
-    const out = clone(doc);
-    let deleted = 0;
-    // Filter a content array in place, dropping matches and recursing into the
-    // surviving children.
-    const walkContent = (content) => {
-        const kept = [];
-        for (const child of content) {
-            if (matchesId(child, nodeId)) {
-                deleted++;
-                continue;
-            }
-            if (isObject(child) && Array.isArray(child.content)) {
-                child.content = walkContent(child.content);
-            }
-            kept.push(child);
-        }
-        return kept;
-    };
-    if (isObject(out) && Array.isArray(out.content)) {
-        out.content = walkContent(out.content);
-    }
-    return { doc: out, deleted };
-}
-/**
- * Throw a clear, model-actionable error when a node-id write op did NOT match
- * exactly one node (#159). `count === 0` -> "no node found"; `count > 1` ->
- * "ambiguous, refused" — Docmost duplicates block ids on copy/paste, so a write
- * by id could clobber/remove EVERY duplicate. The caller skips the write for any
- * `count !== 1` (the transform returns null), so this only REPORTS; nothing was
- * changed. No-op for the unambiguous single-match case.
- */
-export function assertUnambiguousMatch(op, verb, count, nodeId, pageId) {
-    if (count === 0) {
-        throw new Error(`${op}: no node with id "${nodeId}" found on page ${pageId}`);
-    }
-    if (count > 1) {
-        throw new Error(`${op}: id "${nodeId}" is ambiguous — ${count} nodes on page ${pageId} share it (block ids are duplicated on copy/paste). Refusing to ${verb} all of them; nothing was changed. Re-target with a more specific anchor.`);
-    }
-}
-/**
- * Deep-clone `doc` and strip every node/mark attribute whose value is strictly
- * `undefined`, so the result is safe to hand to Yjs (which throws an opaque
- * "Unexpected content type" when asked to store an `undefined` attribute value).
- *
- * Only `undefined` keys are removed; `null`, `false`, `0`, and `""` are all
- * legitimate JSON-storable values and are preserved. Operates on a clone and
- * returns it; the input is never mutated. Defensively null-safe like the rest
- * of the file.
- */
-export function sanitizeForYjs(doc) {
-    const out = clone(doc);
-    // Drop every key whose value is strictly `undefined` from an attrs object.
-    const stripUndefined = (attrs) => {
-        if (!isObject(attrs))
-            return;
-        for (const key of Object.keys(attrs)) {
-            if (attrs[key] === undefined) {
-                delete attrs[key];
-            }
-        }
-    };
-    const walk = (node) => {
-        if (!isObject(node))
-            return;
-        stripUndefined(node.attrs);
-        if (Array.isArray(node.marks)) {
-            for (const mark of node.marks) {
-                if (isObject(mark))
-                    stripUndefined(mark.attrs);
-            }
-        }
-        if (Array.isArray(node.content)) {
-            for (const child of node.content) {
-                walk(child);
-            }
-        }
-    };
-    walk(out);
-    return out;
-}
-/**
- * Diagnostics helper: walk the tree and return a human-readable path string for
- * the FIRST attribute value (in any `node.attrs` or `mark.attrs`) that Yjs
- * cannot store — i.e. `undefined`, a `function`, a `symbol`, or a `bigint`
- * (e.g. `content[3].content[0].attrs.indent (undefined)`). Returns `null` when
- * every attribute is storable. Null-safe.
- */
-export function findUnstorableAttr(doc) {
-    const isUnstorable = (value) => {
-        if (value === undefined)
-            return "undefined";
-        const t = typeof value;
-        if (t === "function")
-            return "function";
-        if (t === "symbol")
-            return "symbol";
-        if (t === "bigint")
-            return "bigint";
-        return null;
-    };
-    // Check an attrs object; return the offending sub-path or null.
-    const checkAttrs = (attrs, basePath) => {
-        if (!isObject(attrs))
-            return null;
-        for (const key of Object.keys(attrs)) {
-            const kind = isUnstorable(attrs[key]);
-            if (kind != null)
-                return `${basePath}.${key} (${kind})`;
-        }
-        return null;
-    };
-    const walk = (node, path) => {
-        if (!isObject(node))
-            return null;
-        const attrHit = checkAttrs(node.attrs, `${path}.attrs`);
-        if (attrHit != null)
-            return attrHit;
-        if (Array.isArray(node.marks)) {
-            for (let i = 0; i < node.marks.length; i++) {
-                const markHit = checkAttrs(node.marks[i]?.attrs, `${path}.marks[${i}].attrs`);
-                if (markHit != null)
-                    return markHit;
-            }
-        }
-        if (Array.isArray(node.content)) {
-            for (let i = 0; i < node.content.length; i++) {
-                const childHit = walk(node.content[i], `${path}.content[${i}]`);
-                if (childHit != null)
-                    return childHit;
-            }
-        }
-        return null;
-    };
-    // The root doc node carries no useful index, so start the path at "doc".
-    if (!isObject(doc))
-        return null;
-    const attrHit = checkAttrs(doc.attrs, "attrs");
-    if (attrHit != null)
-        return attrHit;
-    if (Array.isArray(doc.content)) {
-        for (let i = 0; i < doc.content.length; i++) {
-            const childHit = walk(doc.content[i], `content[${i}]`);
-            if (childHit != null)
-                return childHit;
-        }
-    }
-    return null;
-}
-/**
- * Table structural node types and the container each must live directly inside.
- * Used by `insertNodeRelative` to splice rows/cells into the correct ancestor
- * rather than blindly into the anchor's direct parent (which would corrupt the
- * table's nesting).
- */
-const STRUCTURAL_TYPES = new Set(["tableRow", "tableCell", "tableHeader"]);
-const REQUIRED_CONTAINER = {
-    tableRow: "table",
-    tableCell: "tableRow",
-    tableHeader: "tableRow",
-};
-/**
- * Find the index of the first TOP-LEVEL block whose plain text includes the
- * anchor, with a markdown-stripping FALLBACK. Returns -1 when none matches.
- *
- * Two passes preserve "exact wins globally":
- *  - Pass 1: first block containing the verbatim `anchorText`.
- *  - Pass 2 (only if pass 1 found nothing): first block containing the
- *    markdown-stripped anchor, when stripping actually changed it.
- */
-function findAnchorTextIndex(content, anchorText) {
-    if (!Array.isArray(content))
-        return -1;
-    // Pass 1: exact.
-    for (let i = 0; i < content.length; i++) {
-        if (blockPlainText(content[i]).includes(anchorText))
-            return i;
-    }
-    // Pass 2: markdown-stripped fallback.
-    const a = stripInlineMarkdown(anchorText);
-    if (a !== anchorText && a.length > 0) {
-        for (let i = 0; i < content.length; i++) {
-            if (blockPlainText(content[i]).includes(a))
-                return i;
-        }
-    }
-    return -1;
-}
-/**
- * Locate an anchor and return its ancestor chain (from `doc` down to and
- * including the matched node). Each chain entry is `{ node, index }` where
- * `index` is the node's position inside its parent's `content` array (the root
- * doc has index -1). Returns `null` when the anchor cannot be resolved.
- */
-function findAnchorChain(doc, opts) {
-    if (!isObject(doc))
-        return null;
-    // DFS by id anywhere in the tree, accumulating the path.
-    if (opts.anchorNodeId != null) {
-        const targetId = opts.anchorNodeId;
-        const search = (node, index, trail) => {
-            if (!isObject(node))
-                return null;
-            const here = [...trail, { node, index }];
-            if (matchesId(node, targetId))
-                return here;
-            if (Array.isArray(node.content)) {
-                for (let i = 0; i < node.content.length; i++) {
-                    const hit = search(node.content[i], i, here);
-                    if (hit != null)
-                        return hit;
-                }
-            }
-            return null;
-        };
-        return search(doc, -1, []);
-    }
-    // By text: only top-level blocks are scanned (same rule as the JSON path).
-    // Exact match wins; a markdown-stripped fallback is tried only on a miss.
-    if (opts.anchorText != null && Array.isArray(doc.content)) {
-        const i = findAnchorTextIndex(doc.content, opts.anchorText);
-        if (i !== -1) {
-            return [
-                { node: doc, index: -1 },
-                { node: doc.content[i], index: i },
-            ];
-        }
-    }
-    return null;
-}
-/**
- * Insert a deep clone of `node` relative to an anchor.
- *
- * - position "append": push the node onto the top-level `doc.content`.
- * - position "before"/"after": locate the anchor and splice the node into the
- *   anchor's parent `content` array immediately before / after it.
- *
- * Anchor resolution for before/after:
- *   - if `anchorNodeId` is given, find the node with `attrs.id === anchorNodeId`
- *     anywhere in the tree (recursive);
- *   - otherwise, if `anchorText` is given, scan only TOP-LEVEL `doc.content`
- *     blocks and pick the first whose `blockPlainText` includes `anchorText`.
- *
- * Operates on a clone of `doc`; returns `{ doc, inserted }`. `inserted` is
- * false when the anchor could not be resolved (the doc is returned unchanged
- * apart from being cloned).
- */
-export function insertNodeRelative(doc, node, opts) {
-    const out = clone(doc);
-    const fresh = clone(node);
-    // Defensive: stay null-safe like the other exports — a missing opts means
-    // there is nothing actionable to do.
-    if (!isObject(opts))
-        return { doc: out, inserted: false };
-    const isStructural = isObject(node) && STRUCTURAL_TYPES.has(node.type);
-    // "append": top-level push.
-    if (opts.position === "append") {
-        // Structural table nodes (tableRow/tableCell/tableHeader) cannot live at the
-        // top level — appending one would produce invalid nesting.
-        if (isStructural) {
-            throw new Error(`insert_node: cannot append a ${node.type} at the top level; use ` +
-                `position before/after with an anchor inside the target table`);
-        }
-        if (isObject(out)) {
-            if (!Array.isArray(out.content))
-                out.content = [];
-            out.content.push(fresh);
-            return { doc: out, inserted: true };
-        }
-        return { doc: out, inserted: false };
-    }
-    const offset = opts.position === "after" ? 1 : 0;
-    // Structural insert (before/after a tableRow/tableCell/tableHeader): splice
-    // into the nearest enclosing table/tableRow rather than the anchor's direct
-    // parent, so the row/cell lands at the correct level of the table.
-    if (isStructural) {
-        const containerType = REQUIRED_CONTAINER[node.type];
-        const chain = findAnchorChain(out, opts);
-        // Anchor not resolved at all — keep the existing "anchor not found" path.
-        if (chain == null)
-            return { doc: out, inserted: false };
-        // Find the DEEPEST ancestor (including the anchor itself) of the required
-        // container type.
-        let containerIdx = -1;
-        for (let i = chain.length - 1; i >= 0; i--) {
-            if (isObject(chain[i].node) && chain[i].node.type === containerType) {
-                containerIdx = i;
-                break;
-            }
-        }
-        if (containerIdx === -1) {
-            throw new Error(`insert_node: cannot insert a ${node.type} here — the anchor is not ` +
-                `inside a ${containerType}. Anchor on a cell's text or a block id ` +
-                `that lives inside the target table.`);
-        }
-        const container = chain[containerIdx].node;
-        if (!Array.isArray(container.content))
-            container.content = [];
-        if (containerIdx === chain.length - 1) {
-            // The matched container IS the anchor node itself (e.g. anchorText
-            // resolved to the table block): append/prepend within it.
-            const at = opts.position === "after" ? container.content.length : 0;
-            container.content.splice(at, 0, fresh);
-        }
-        else {
-            // The immediate child on the path leading to the anchor is the row/cell
-            // to splice next to.
-            const enclosingChildIndex = chain[containerIdx + 1].index;
-            container.content.splice(enclosingChildIndex + offset, 0, fresh);
-        }
-        return { doc: out, inserted: true };
-    }
-    // Resolve by id anywhere in the tree: splice into the parent content array.
-    if (opts.anchorNodeId != null) {
-        let inserted = false;
-        const walkContent = (content) => {
-            for (let i = 0; i < content.length; i++) {
-                const child = content[i];
-                if (matchesId(child, opts.anchorNodeId)) {
-                    content.splice(i + offset, 0, fresh);
-                    inserted = true;
-                    return;
-                }
-                if (isObject(child) && Array.isArray(child.content)) {
-                    walkContent(child.content);
-                    if (inserted)
-                        return;
-                }
-            }
-        };
-        if (isObject(out) && Array.isArray(out.content)) {
-            walkContent(out.content);
-        }
-        return { doc: out, inserted };
-    }
-    // Resolve by text: only top-level doc.content blocks are scanned. Exact
-    // match wins; a markdown-stripped fallback is tried only on a miss.
-    if (opts.anchorText != null && isObject(out) && Array.isArray(out.content)) {
-        const i = findAnchorTextIndex(out.content, opts.anchorText);
-        if (i !== -1) {
-            out.content.splice(i + offset, 0, fresh);
-            return { doc: out, inserted: true };
-        }
-    }
-    return { doc: out, inserted: false };
-}
-// ===========================================================================
-// Table editing helpers
-//
-// A Docmost table is a ProseMirror subtree with NO ids on the structural nodes:
-//   table   -> { type:"table",     content:[tableRow...] }
-//   row     -> { type:"tableRow",  content:[tableCell|tableHeader...] }
-//   cell    -> { type:"tableCell"|"tableHeader", attrs:{colspan,rowspan,colwidth},
-//                content:[paragraph...] }
-//   para    -> { type:"paragraph", attrs:{id,indent}, content:[textNode...] }
-// Only paragraphs/headings carry an `attrs.id`, so a cell is addressed via the
-// id of the paragraph inside it. The helpers below all operate on a DEEP CLONE
-// of the input doc (via `clone`) and never mutate their inputs.
-// ===========================================================================
-/**
- * Collect EVERY `attrs.id` present anywhere in `node` into `used`. Used to seed
- * `makeFreshId` so generated paragraph ids never collide with existing ones.
- */
-function collectIds(node, used) {
-    if (!isObject(node))
-        return;
-    if (isObject(node.attrs) && typeof node.attrs.id === "string") {
-        used.add(node.attrs.id);
-    }
-    if (Array.isArray(node.content)) {
-        for (const child of node.content)
-            collectIds(child, used);
-    }
-}
-/**
- * Fresh-id generator: returns a random Docmost-style id (12 chars from
- * lowercase `a-z0-9`) that is not already in `used`, and records it. On the
- * rare collision the id is regenerated. Callers rely on uniqueness, not on the
- * exact string, so randomness is fine — and unlike a module-local counter it
- * needs no reset and cannot become predictable across calls.
- */
-function makeFreshId(used) {
-    const alphabet = "abcdefghijklmnopqrstuvwxyz0123456789";
-    let id;
-    do {
-        id = "";
-        for (let i = 0; i < 12; i++) {
-            id += alphabet[Math.floor(Math.random() * alphabet.length)];
-        }
-    } while (used.has(id) || id === "");
-    used.add(id);
-    return id;
-}
-/**
- * Resolve a table reference against an ALREADY-CLONED doc and return the LIVE
- * table node (a reference inside `rootClone`, so the caller may mutate it) plus
- * its index path. Returns null when no table matches.
- *
- * - `#<n>`: the top-level block at index `n`, only if its `type === "table"`.
- * - otherwise: DFS for the node with `attrs.id === tableRef`, then walk UP its
- *   ancestor chain to the nearest `type === "table"` ancestor.
- */
-function locateTable(rootClone, tableRef) {
-    if (!isObject(rootClone))
-        return null;
-    // "#<n>": index into the top-level content array; must be a table.
-    const indexMatch = typeof tableRef === "string" ? tableRef.match(/^#(\d+)$/) : null;
-    if (indexMatch) {
-        const index = Number(indexMatch[1]);
-        const block = Array.isArray(rootClone.content)
-            ? rootClone.content[index]
-            : undefined;
-        if (isObject(block) && block.type === "table") {
-            return { table: block, path: [index] };
-        }
-        return null;
-    }
-    // Otherwise: DFS for attrs.id === tableRef, tracking the ancestor chain, then
-    // climb to the nearest enclosing table.
-    const search = (node, trail) => {
-        if (!isObject(node))
-            return null;
-        if (Array.isArray(node.content)) {
-            for (let i = 0; i < node.content.length; i++) {
-                const child = node.content[i];
-                const here = [...trail, { node: child, index: i }];
-                if (matchesId(child, tableRef)) {
-                    // Walk UP to the nearest table ancestor (including the match itself).
-                    for (let j = here.length - 1; j >= 0; j--) {
-                        if (isObject(here[j].node) && here[j].node.type === "table") {
-                            return {
-                                table: here[j].node,
-                                path: here.slice(0, j + 1).map((e) => e.index),
-                            };
-                        }
-                    }
-                    return null; // id found but no enclosing table
-                }
-                const hit = search(child, here);
-                if (hit != null)
-                    return hit;
-            }
-        }
-        return null;
-    };
-    return search(rootClone, []);
-}
-/** Build the plain-text → single-paragraph cell content used by all writers. */
-function makeCellParagraph(id, text) {
-    return {
-        type: "paragraph",
-        attrs: { id, indent: 0 },
-        // Empty string → a paragraph with an empty content array.
-        content: text ? [{ type: "text", text }] : [],
-    };
-}
-/**
- * Read a table as a matrix. Returns null when `tableRef` resolves to no table.
- *
- * - `rows`/`cols`: the table's row count and the column count of its FIRST row.
- *   Tables may be ragged (rows of differing length), so `cols` reflects only
- *   row 0; use the per-row length of `cells`/`cellIds` for each row's actual
- *   width.
- * - `cells`: `string[][]` of each cell's `blockPlainText`.
- * - `cellIds`: `(string|null)[][]` of each cell's FIRST paragraph id (or null),
- *   so callers can `patch_node` a cell for rich-formatted edits.
- * - `path`: index path of the table within the doc.
- */
-export function readTable(doc, tableRef) {
-    const root = clone(doc);
-    const located = locateTable(root, tableRef);
-    if (located == null)
-        return null;
-    const { table, path } = located;
-    const rowNodes = Array.isArray(table.content) ? table.content : [];
-    const rows = rowNodes.length;
-    const cols = rowNodes[0]?.content?.length ?? 0;
-    const cells = [];
-    const cellIds = [];
-    for (const rowNode of rowNodes) {
-        const cellNodes = Array.isArray(rowNode?.content) ? rowNode.content : [];
-        const rowText = [];
-        const rowIds = [];
-        for (const cellNode of cellNodes) {
-            rowText.push(blockPlainText(cellNode));
-            // The cell's first paragraph carries the id used for patch_node.
-            const firstPara = Array.isArray(cellNode?.content)
-                ? cellNode.content[0]
-                : undefined;
-            const id = isObject(firstPara) && isObject(firstPara.attrs)
-                ? (firstPara.attrs.id ?? null)
-                : null;
-            rowIds.push(id);
-        }
-        cells.push(rowText);
-        cellIds.push(rowIds);
-    }
-    return { rows, cols, cells, cellIds, path };
-}
-/**
- * Insert a row of plain-text cells into a table. Returns `{ doc, inserted }`.
- *
- * The row is padded to the table's column count (`cells[i] ?? ""`); supplying
- * MORE cells than columns throws. Each new cell copies `colwidth` for its
- * column from the header row when present, gets a fresh-id paragraph, and a
- * `colspan:1, rowspan:1` attrs. `index` (when an integer in `[0, rows]`) splices
- * the row there; otherwise the row is appended at the end.
- */
-export function insertTableRow(doc, tableRef, cells, index) {
-    const out = clone(doc);
-    const located = locateTable(out, tableRef);
-    if (located == null)
-        return { doc: out, inserted: false };
-    const { table } = located;
-    if (!Array.isArray(table.content))
-        table.content = [];
-    const rows = table.content.length;
-    const headerRow = table.content[0];
-    const headerCells = Array.isArray(headerRow?.content)
-        ? headerRow.content
-        : [];
-    // Column count is the WIDEST existing row, so the guard below stays
-    // meaningful for ragged tables and the new row matches the table's width.
-    // Fall back to the supplied cell count only when the table has no rows.
-    let colCount = 0;
-    for (const r of table.content) {
-        if (isObject(r) && Array.isArray(r.content))
-            colCount = Math.max(colCount, r.content.length);
-    }
-    if (colCount === 0)
-        colCount = Array.isArray(cells) ? cells.length : 0;
-    if (Array.isArray(cells) && cells.length > colCount) {
-        throw new Error(`table_insert_row: got ${cells.length} cell(s) but the table has ${colCount} column(s)`);
-    }
-    // Resolve the landing index up front so the cell-type decision and the splice
-    // below agree: a valid integer in [0, rows] splices there, else we append.
-    const landingIndex = typeof index === "number" &&
-        Number.isInteger(index) &&
-        index >= 0 &&
-        index <= rows
-        ? index
-        : rows;
-    // Seed the id generator with every id already in the doc so the new cell
-    // paragraph ids are unique within the whole document.
-    const used = new Set();
-    collectIds(out, used);
-    const newCells = [];
-    for (let i = 0; i < colCount; i++) {
-        const text = (Array.isArray(cells) ? cells[i] : undefined) ?? "";
-        const attrs = { colspan: 1, rowspan: 1 };
-        // Copy this column's colwidth from the header row's cell when present.
-        const colwidth = headerCells[i]?.attrs?.colwidth;
-        if (colwidth !== undefined)
-            attrs.colwidth = colwidth;
-        // A row landing at index 0 becomes the new header row, so inherit the
-        // current header cell's type per column (Docmost uses "tableHeader" there);
-        // every other position is a plain data cell.
-        const cellType = landingIndex === 0 ? (headerCells[i]?.type ?? "tableCell") : "tableCell";
-        newCells.push({
-            type: cellType,
-            attrs,
-            content: [makeCellParagraph(makeFreshId(used), text)],
-        });
-    }
-    const newRow = { type: "tableRow", content: newCells };
-    // Splice at the resolved landing index (append when index was omitted/invalid).
-    table.content.splice(landingIndex, 0, newRow);
-    return { doc: out, inserted: true };
-}
-/**
- * Delete the row at 0-based `index` from a table. Returns `{ doc, deleted }`.
- * `deleted` is false only when the table cannot be located. Throws on an
- * out-of-range index, and refuses to delete the table's only row.
- */
-export function deleteTableRow(doc, tableRef, index) {
-    const out = clone(doc);
-    const located = locateTable(out, tableRef);
-    if (located == null)
-        return { doc: out, deleted: false };
-    const { table } = located;
-    if (!Array.isArray(table.content))
-        table.content = [];
-    const rows = table.content.length;
-    if (!Number.isInteger(index) || index < 0 || index >= rows) {
-        throw new Error(`table_delete_row: row index ${index} out of range (table has ${rows} row(s))`);
-    }
-    if (rows <= 1) {
-        throw new Error("table_delete_row: refusing to delete the only row of the table");
-    }
-    table.content.splice(index, 1);
-    return { doc: out, deleted: true };
-}
-/**
- * Set the plain-text content of cell `[row, col]` (0-based) to `text`. Returns
- * `{ doc, updated }`; `updated` is false only when the table cannot be located.
- * Throws when `row`/`col` is out of range. The cell's own attrs (colspan/
- * rowspan/colwidth) are preserved; its content becomes a single text paragraph
- * that reuses the cell's existing first-paragraph id when present, else a fresh
- * one.
- */
-export function updateTableCell(doc, tableRef, row, col, text) {
-    const out = clone(doc);
-    const located = locateTable(out, tableRef);
-    if (located == null)
-        return { doc: out, updated: false };
-    const { table } = located;
-    const rowNodes = Array.isArray(table.content) ? table.content : [];
-    const rows = rowNodes.length;
-    const rowNode = rowNodes[row];
-    const cols = isObject(rowNode) && Array.isArray(rowNode.content)
-        ? rowNode.content.length
-        : 0;
-    if (!Number.isInteger(row) ||
-        row < 0 ||
-        row >= rows ||
-        !Number.isInteger(col) ||
-        col < 0 ||
-        col >= cols) {
-        throw new Error(`table_update_cell: cell [${row},${col}] out of range`);
-    }
-    const cellNode = rowNode.content[col];
-    // Reuse the cell's existing first-paragraph id, or mint a fresh unique one.
-    const existingPara = Array.isArray(cellNode?.content)
-        ? cellNode.content[0]
-        : undefined;
-    let id = isObject(existingPara) && isObject(existingPara.attrs)
-        ? existingPara.attrs.id
-        : undefined;
-    if (typeof id !== "string" || id.length === 0) {
-        const used = new Set();
-        collectIds(out, used);
-        id = makeFreshId(used);
-    }
-    cellNode.content = [makeCellParagraph(id, text)];
-    return { doc: out, updated: true };
-}
diff --git a/packages/mcp/build/lib/page-lock.js b/packages/mcp/build/lib/page-lock.js
deleted file mode 100644
index ddba2663..00000000
--- a/packages/mcp/build/lib/page-lock.js
+++ /dev/null
@@ -1,31 +0,0 @@
-/**
- * Per-page async mutex.
- *
- * Content writes over the collaboration websocket must never overlap for the
- * same page: two concurrent full-document replaces would race on the live Yjs
- * fragment. We serialize them with a per-pageId promise chain — each new
- * operation waits for the previous one on that page to settle (success or
- * failure) before it runs. Different pages never block each other.
- */
-const chains = new Map();
-// The returned promise carries the real result/rejection of `fn` and MUST be
-// awaited/handled by the caller; only the internal chaining tail swallows
-// errors (purely to gate ordering).
-export function withPageLock(pageId, fn) {
-    // Wait for the previous op on this page; swallow its error so a failure does
-    // not poison the queue for the next caller.
-    const prev = (chains.get(pageId) ?? Promise.resolve()).catch(() => { });
-    const run = prev.then(fn);
-    // The tail used for chaining must also swallow errors (it only gates order).
-    const tail = run.catch(() => { });
-    chains.set(pageId, tail);
-    // Drop the map entry once this op is the tail and has settled, to avoid an
-    // unbounded map of resolved promises.
-    tail.then(() => {
-        if (chains.get(pageId) === tail) {
-            chains.delete(pageId);
-        }
-    });
-    // Callers get the real result/rejection of fn.
-    return run;
-}
diff --git a/packages/mcp/build/lib/page-search.js b/packages/mcp/build/lib/page-search.js
deleted file mode 100644
index 34ca407b..00000000
--- a/packages/mcp/build/lib/page-search.js
+++ /dev/null
@@ -1,186 +0,0 @@
-/**
- * Pure, network-free in-page search over a ProseMirror/TipTap document tree.
- *
- * `searchInDoc(doc, query, opts)` finds every occurrence of a literal substring
- * (default) or a regular expression across the page's TEXT CONTAINERS and
- * reports WHERE each match is — the container's ref (for get_node/patch_node;
- * see the SearchMatch.nodeId note for the `#<index>` caveat), the top-level
- * block index, and a short context window around the hit. It never touches the
- * network, the DB, or the schema mirror; like `comment-anchor.ts` it is
- * isolated-testable.
- *
- * REGEX ENGINE: with `regex:true` the pattern is compiled with RE2 (Google's
- * linear-time engine), NOT the JS `RegExp`. RE2 has no backtracking, so a
- * catastrophic pattern (e.g. `(a+)+$`) can never wedge the shared event loop —
- * it runs in linear time. The trade-off is that RE2 does not support the
- * backtracking-only features lookaround (`(?=…)`, `(?<=…)`) and backreferences
- * (`\1`); such a pattern is rejected up front with a clear tool error (see
- * searchInDoc) rather than being run, which is the desired behaviour — a clear
- * error the agent can fix beats a server hang.
- *
- * WHY plain text (not markdown): each container's inline text is glued into ONE
- * string via `blockPlainText`, so a match survives inline-mark boundaries
- * (bold/italic/link splits that fracture a run like "т.е." into several text
- * nodes) and comment-anchor spans never clutter the haystack.
- *
- * The SEARCH UNIT is a text container: a node whose direct children include
- * text nodes (a paragraph/heading, or the paragraph inside a table cell / list
- * item). ProseMirror keeps block vs. inline content exclusive, so a container
- * never nests another container — the walk reaches each cell/item's own text and
- * the context window is naturally scoped to that specific cell/item, not the
- * whole top-level block's glued text.
- */
-import RE2 from "re2";
-import { blockPlainText } from "./node-ops.js";
-/** True if `value` is a non-null plain object (and not an array). */
-function isObject(value) {
-    return value != null && typeof value === "object" && !Array.isArray(value);
-}
-/**
- * A text container is a node with a `content` array holding at least one text
- * node (a child with a string `text`). These are the paragraphs/headings whose
- * glued inline text we search.
- */
-function isTextContainer(node) {
-    return (isObject(node) &&
-        Array.isArray(node.content) &&
-        node.content.some((c) => isObject(c) && typeof c.text === "string"));
-}
-// Result-size defaults/ceiling.
-const DEFAULT_LIMIT = 50;
-const MAX_LIMIT = 200;
-// Context window on each side of a match.
-const CONTEXT = 40;
-// Cheap sanity cap on the query/pattern length. ReDoS is handled structurally
-// by the RE2 engine (linear-time, no backtracking — see the module doc), so we
-// no longer truncate the per-container text: RE2 scans it in linear time and a
-// cap could silently drop real matches past it. This just rejects an absurdly
-// long pattern early with a clear error.
-const MAX_PATTERN_LENGTH = 1000;
-/** Clamp the requested limit into [1, MAX_LIMIT], defaulting when absent. */
-function resolveLimit(limit) {
-    const n = typeof limit === "number" && Number.isFinite(limit) ? limit : DEFAULT_LIMIT;
-    return Math.min(MAX_LIMIT, Math.max(1, Math.floor(n)));
-}
-/**
- * Yield the [start, length] of every occurrence of the engine in `text`, in
- * order. A literal engine uses indexOf (case-folded when requested); a regex
- * engine uses a global RE2 regex (RE2 extends `RegExp`, so `.exec` advances
- * `lastIndex` exactly like the native engine). Zero-length regex matches (e.g.
- * `\b`, `a*`) are SKIPPED and lastIndex is advanced, so a pattern that can match
- * the empty string cannot flood the results or spin forever.
- */
-function* eachMatch(text, query, re, caseSensitive) {
-    if (re) {
-        re.lastIndex = 0;
-        let m;
-        while ((m = re.exec(text)) != null) {
-            const len = m[0].length;
-            if (len === 0) {
-                // Empty match: advance past this position and do not record it.
-                re.lastIndex = m.index + 1;
-                continue;
-            }
-            yield [m.index, len];
-        }
-        return;
-    }
-    // Literal engine. For case-insensitive search, fold BOTH sides only to locate
-    // the indices; the reported match/context are always sliced from the original
-    // text so the caller gets the real casing (needed to build a unique selection).
-    const haystack = caseSensitive ? text : text.toLowerCase();
-    const needle = caseSensitive ? query : query.toLowerCase();
-    const len = needle.length;
-    let from = 0;
-    for (;;) {
-        const idx = haystack.indexOf(needle, from);
-        if (idx === -1)
-            return;
-        yield [idx, len];
-        from = idx + len;
-    }
-}
-/**
- * Search a ProseMirror document for `query` and return `{ total, truncated,
- * matches }`. `total` counts EVERY occurrence (even beyond the limit) and
- * `truncated` flags when the returned list was capped — nothing is silently
- * dropped.
- *
- * Throws a clear, model-actionable error (never a generic failure) on: an
- * empty/whitespace-only query, an over-long pattern, or — with `regex:true` — a
- * pattern RE2 rejects (invalid syntax, or the unsupported lookaround/
- * backreference features), so the agent can fix its input.
- */
-export function searchInDoc(doc, query, opts = {}) {
-    // --- edge-case guards (fail loudly so the agent can correct the call) ---
-    if (typeof query !== "string" || query.trim().length === 0) {
-        throw new Error("search_in_page: query is empty — pass the text (or regex) to look for.");
-    }
-    if (query.length > MAX_PATTERN_LENGTH) {
-        throw new Error(`search_in_page: query is too long (${query.length} chars; max ${MAX_PATTERN_LENGTH}). Shorten the search text/pattern.`);
-    }
-    const caseSensitive = opts.caseSensitive === true;
-    const limit = resolveLimit(opts.limit);
-    // Compile the pattern up front with RE2 (linear-time, ReDoS-safe) so a bad
-    // pattern is a clean tool error rather than a failure deep in the traversal —
-    // and so a catastrophic-backtracking pattern can never wedge the event loop.
-    // RE2 throws both on syntactically invalid input AND on backtracking-only
-    // features it does not implement (lookaround, backreferences); both map to the
-    // same actionable error so the agent rewrites the pattern.
-    let re = null;
-    if (opts.regex === true) {
-        try {
-            re = new RE2(query, caseSensitive ? "g" : "gi");
-        }
-        catch (e) {
-            throw new Error(`search_in_page: invalid or unsupported regular expression: ${e instanceof Error ? e.message : String(e)} — RE2 does not support lookaround ((?=…)/(?<=…)) or backreferences (\\1); rewrite the pattern without them.`);
-        }
-    }
-    const matches = [];
-    let total = 0;
-    const topLevel = isObject(doc) && Array.isArray(doc.content) ? doc.content : [];
-    // Descend a top-level block, collecting matches from every text container
-    // within it. blockIndex/topRef stay pinned to the enclosing top-level block.
-    const descend = (node, blockIndex, topRef) => {
-        if (!isObject(node))
-            return;
-        if (isTextContainer(node)) {
-            // Glue this container's inline text into one string (mark-safe). No length
-            // cap: RE2 scans it in linear time (no ReDoS) and the whole document is
-            // already in memory, so truncating would only risk dropping real matches
-            // in a very long container.
-            const text = blockPlainText(node);
-            // The container's own id addresses it verbatim in get_node/patch_node; a
-            // container with no id (e.g. a table-cell paragraph) falls back to the
-            // top-level block's #<index> (readable via get_node, but not patchable —
-            // see the SearchMatch.nodeId note).
-            const id = isObject(node.attrs) && typeof node.attrs.id === "string" && node.attrs.id.length > 0
-                ? node.attrs.id
-                : topRef;
-            for (const [idx, len] of eachMatch(text, query, re, caseSensitive)) {
-                total++;
-                if (matches.length < limit) {
-                    matches.push({
-                        nodeId: id,
-                        blockIndex,
-                        type: node.type,
-                        before: text.slice(Math.max(0, idx - CONTEXT), idx),
-                        match: text.slice(idx, idx + len),
-                        after: text.slice(idx + len, idx + len + CONTEXT),
-                    });
-                }
-            }
-            // A text container holds inline content only — no nested containers to
-            // recurse into.
-            return;
-        }
-        if (Array.isArray(node.content)) {
-            for (const child of node.content)
-                descend(child, blockIndex, topRef);
-        }
-    };
-    for (let i = 0; i < topLevel.length; i++) {
-        descend(topLevel[i], i, `#${i}`);
-    }
-    return { total, truncated: total > matches.length, matches };
-}
diff --git a/packages/mcp/build/lib/parse-node-arg.js b/packages/mcp/build/lib/parse-node-arg.js
deleted file mode 100644
index 4598b136..00000000
--- a/packages/mcp/build/lib/parse-node-arg.js
+++ /dev/null
@@ -1,15 +0,0 @@
-// The model sometimes serializes a ProseMirror node arg as a JSON string
-// instead of an object. Normalize: parse a string to an object (throwing on
-// invalid JSON), pass an object through unchanged. Shared by patch_node /
-// insert_node (and the analogous update_page_json content parsing).
-export function parseNodeArg(node, errMsg = "node was a string but not valid JSON") {
-    if (typeof node === "string") {
-        try {
-            return JSON.parse(node);
-        }
-        catch {
-            throw new Error(errMsg);
-        }
-    }
-    return node;
-}
diff --git a/packages/mcp/build/lib/text-normalize.js b/packages/mcp/build/lib/text-normalize.js
deleted file mode 100644
index 4db72e4b..00000000
--- a/packages/mcp/build/lib/text-normalize.js
+++ /dev/null
@@ -1,108 +0,0 @@
-/**
- * Locator normalization: strip inline markdown wrappers and trailing
- * decoration from a LOCATOR string so a find/anchor that the model wrote with
- * markdown (or a stray emoji) can still match the document's plain text.
- *
- * This is used ONLY as a fallback for LOCATING (after an exact match fails);
- * it is never applied to replacement text or inserted node content, so no
- * formatting is ever lost.
- */
-/** Maximum unwrap passes, so pathological/nested input cannot loop forever. */
-const MAX_PASSES = 8;
-/**
- * Inline emphasis/code/strikethrough wrappers, strong BEFORE emphasis so
- * `**x**` collapses to `x` rather than leaving a stray `*x*`. Each pattern is
- * non-greedy and capture group 1 is the inner text. Applied repeatedly until
- * the string stops changing (nested wrappers like `**_x_**`).
- */
-const WRAPPER_PATTERNS = [
-    /\*\*([^*]+?)\*\*/g, // **x**
-    /__([^_]+?)__/g, // __x__
-    /~~([^~]+?)~~/g, // ~~x~~
-    /\*([^*]+?)\*/g, // *x*
-    /_([^_]+?)_/g, // _x_
-    /``([^`]+?)``/g, // ``x``
-    /`([^`]+?)`/g, // `x`
-];
-/** Links/images -> their visible text. `!?` covers both `[t](u)` and `![a](s)`. */
-const LINK_IMAGE_RE = /!?\[([^\]]*)\]\([^)]*\)/g;
-/**
- * Apply ONLY the two balanced/link passes shared by both normalizers: first
- * collapse links/images to their visible text, then collapse balanced inline
- * wrappers repeatedly until stable. Does NOT trim decoration, does NOT guard
- * against an empty result — it returns exactly the transformed string.
- */
-function stripWrappersAndLinks(s) {
-    // 1. Links/images -> their visible text.
-    let out = s.replace(LINK_IMAGE_RE, "$1");
-    // 2. Strip balanced wrappers, repeating until the string is stable so nested
-    //    wrappers (`**_x_**`) and adjacent runs both collapse.
-    for (let pass = 0; pass < MAX_PASSES; pass++) {
-        const before = out;
-        for (const re of WRAPPER_PATTERNS) {
-            out = out.replace(re, "$1");
-        }
-        if (out === before)
-            break;
-    }
-    return out;
-}
-/**
- * STRICT formatting detector — distinct from the lenient locator
- * normalization below. It strips ONLY what unambiguously is markdown markup:
- *  1. links/images `[text](url)` -> `text`, `![alt](src)` -> `alt`, and
- *  2. balanced inline `**`/`__`/`~~`/`*`/`_`/`` ` `` wrappers (repeat-until-stable),
- * and DELIBERATELY does NOT trim leading/trailing whitespace, emoji, or lone
- * marker chars (the lenient extras `stripInlineMarkdown` does in its step 3).
- *
- * It exists ONLY to recognize formatting-vs-plain INTENT in `applyTextEdits`
- * (deciding whether find/replace differ purely by markdown markers). Because it
- * skips the lenient trimming, ordinary plain-text edits are NOT misread as
- * formatting: a trailing-space trim, snake_case (`my_var_name`), math (`2 * 3`),
- * and identifiers/URLs with underscores all stay untouched here (their `_x_` /
- * `*x*` runs are only collapsed when actually balanced, and even then they are
- * compared symmetrically, so plain text never collapses to a different string).
- *
- * Do NOT use this for LOCATING — the locator fallback must keep using the
- * lenient `stripInlineMarkdown` (it trims stray decoration so a find still
- * matches the document's plain text).
- */
-export function stripBalancedWrappers(s) {
-    if (typeof s !== "string" || s.length === 0)
-        return s;
-    return stripWrappersAndLinks(s);
-}
-/**
- * Conservatively strip inline markdown from a locator string.
- *
- * Deterministic, order-fixed steps:
- *  1. Links/images: `[text](url)` -> `text`, `![alt](src)` -> `alt`.
- *  2. Balanced inline wrappers (strong before emphasis, code, strikethrough),
- *     applied repeatedly until stable for nested cases.
- *  3. Trim leading/trailing decoration only: whitespace, leftover marker chars
- *     (`* _ ~ \``) and emoji. Letters/digits and sentence punctuation (`.`/`,`
- *     etc.) are NEVER trimmed.
- *
- * If the result is empty (e.g. the input was only markers like `***`), the
- * ORIGINAL string is returned so a locator can never normalize down to "" and
- * match everything.
- */
-export function stripInlineMarkdown(s) {
-    if (typeof s !== "string" || s.length === 0)
-        return s;
-    // 1 + 2. Shared link/image and balanced-wrapper passes.
-    let out = stripWrappersAndLinks(s);
-    // 3. Trim leading/trailing decoration: whitespace, leftover markdown markers,
-    //    and emoji (Extended_Pictographic plus the VS16 / ZWJ joiners, plus the
-    //    regional-indicator range U+1F1E6–U+1F1FF for flag emoji, which are NOT
-    //    Extended_Pictographic). The `u` flag enables the Unicode property escape.
-    //    Anchored runs only — interior text and sentence punctuation are untouched.
-    const DECORATION = "[\\s*_~\\x60\\p{Extended_Pictographic}\\u{1F1E6}-\\u{1F1FF}\\u{FE0F}\\u{200D}]+";
-    out = out
-        .replace(new RegExp("^" + DECORATION, "u"), "")
-        .replace(new RegExp(DECORATION + "$", "u"), "");
-    // 4. Never normalize a locator down to nothing.
-    if (out.length === 0)
-        return s;
-    return out;
-}
diff --git a/packages/mcp/build/lib/transforms.js b/packages/mcp/build/lib/transforms.js
deleted file mode 100644
index c1b822ba..00000000
--- a/packages/mcp/build/lib/transforms.js
+++ /dev/null
@@ -1,631 +0,0 @@
-/**
- * Pure, network-free transform primitives for a ProseMirror/TipTap document
- * tree, plus one higher-level orchestration (commentsToFootnotes).
- *
- * A ProseMirror node here is a plain JSON object of the shape produced by
- * Docmost: `{ type, attrs?, content?, text?, marks? }`. Children live in the
- * `content` array; callouts, tables, lists all hold their children in
- * `content`, so a single recursive walk reaches them all.
- *
- * Conventions (matching node-ops.ts):
- *  - functions that produce a new document deep-clone their input and return a
- *    `{ doc, ... }` object; the caller's objects are never mutated.
- *  - functions are defensively null-safe.
- *  - `marks` arrays are preserved verbatim when fragments are split/reordered.
- */
-import { blockPlainText } from "./node-ops.js";
-import { canonicalizeFootnotes } from "./footnote-canonicalize.js";
-import { footnoteContentKey, makeFootnoteDefinition, generateFootnoteId, } from "./footnote-authoring.js";
-export { canonicalizeFootnotes } from "./footnote-canonicalize.js";
-/** Deep-clone a JSON-serializable value without mutating the original. */
-function clone(value) {
-    if (typeof structuredClone === "function") {
-        return structuredClone(value);
-    }
-    // Fallback for environments without structuredClone.
-    return JSON.parse(JSON.stringify(value));
-}
-/** True if `value` is a non-null object (and not an array). */
-function isObject(value) {
-    return value != null && typeof value === "object" && !Array.isArray(value);
-}
-/**
- * Plain text of a node (re-export of node-ops' blockPlainText so transform
- * authors have a single import surface). Recurses through nested content.
- */
-export function blockText(node) {
-    return blockPlainText(node);
-}
-/**
- * Depth-first visit of every node in the tree, including the root and the
- * nested content of callouts, tables, lists, etc. `fn` is called once per node.
- * Null-safe: a nullish or non-object node is ignored.
- */
-export function walk(node, fn) {
-    if (!isObject(node))
-        return;
-    fn(node);
-    if (Array.isArray(node.content)) {
-        for (const child of node.content) {
-            walk(child, fn);
-        }
-    }
-}
-/**
- * Find the FIRST node (depth-first) matching `predicate`, anywhere in the tree.
- * Works even when the node carries no `attrs.id` (it searches the raw tree, not
- * an id index). Returns the live node reference inside `doc` (NOT a clone), or
- * null when nothing matches. Typical use: `getList(doc, n => n.type ===
- * "orderedList")`.
- */
-export function getList(doc, predicate) {
-    let found = null;
-    walk(doc, (node) => {
-        if (found == null && predicate(node)) {
-            found = node;
-        }
-    });
-    return found;
-}
-/**
- * Textblocks that hold raw text but do NOT accept inline atom nodes. A
- * `footnoteReference` is `group:"inline", atom:true`; `codeBlock` is
- * `content:"text*"` (text only), so splicing a footnoteReference into it yields
- * an invalid document. (paragraph/heading/detailsSummary are `inline*` and DO
- * accept it; footnote definitions live inside a footnotesList which the
- * footnote inserter excludes via `beforeBlock`.)
- */
-const INLINE_ATOM_FORBIDDEN_BLOCKS = new Set(["codeBlock"]);
-/**
- * Footnote-notes subtrees the inline footnote inserter must never split into (at
- * any depth): a `footnotesList` and the `footnoteDefinition`s it holds. Anchoring
- * a reference inside one of these would later be dropped as an orphan by the
- * canonicalizer, taking the existing definition's text with it.
- */
-const FOOTNOTE_NOTES_SUBTREES = new Set([
-    "footnotesList",
-    "footnoteDefinition",
-]);
-/** True if `node` IS, or contains at any depth, a footnotesList/footnoteDefinition. */
-function containsFootnoteNotes(node) {
-    if (!isObject(node))
-        return false;
-    if (FOOTNOTE_NOTES_SUBTREES.has(node.type))
-        return true;
-    if (Array.isArray(node.content)) {
-        return node.content.some((c) => containsFootnoteNotes(c));
-    }
-    return false;
-}
-/**
- * Insert `marker` as a PLAIN (unmarked) text run right after the first
- * occurrence of `anchor`.
- *
- * The text run that contains the END of the anchor is SPLIT at the anchor end,
- * so all existing marks (links, bold, ...) on the surrounding text are
- * preserved, while the inserted marker run carries NO marks. The marker is
- * inserted as a leading-space-padded run (`" " + marker`) so it visually
- * separates from the preceding word.
- *
- * The anchor is matched against the concatenated plain text of each top-level
- * block (so an anchor that spans several text/mark runs still matches). The
- * insertion happens inside the inline content array that holds the anchor's
- * final character.
- *
- * Operates on a clone of `doc`; returns `{ doc, inserted }`. `inserted` is
- * false when the anchor text was not found in any in-scope block.
- */
-export function insertMarkerAfter(doc, anchor, marker, opts = {}) {
-    // A plain marker is a leading-space-padded unmarked text run.
-    return insertNodesAfterAnchor(doc, anchor, () => [{ type: "text", text: " " + marker }], opts);
-}
-/**
- * Mark-safe insertion CORE: split the inline text run that holds the END of
- * `anchor` (preserving the surrounding marks) and splice the nodes produced by
- * `makeMiddle()` in at the split point. `insertMarkerAfter` (plain text marker)
- * and `insertInlineFootnote` (a `footnoteReference` node) are both thin callers —
- * the only difference is WHAT is inserted (a space-padded text run vs. a node
- * that should hug the preceding word), which is exactly what `makeMiddle`
- * decides. Operates on a clone; returns `{ doc, inserted }`.
- */
-function insertNodesAfterAnchor(doc, anchor, makeMiddle, opts = {}) {
-    const out = clone(doc);
-    if (!isObject(out) || !Array.isArray(out.content) || !anchor) {
-        return { doc: out, inserted: false };
-    }
-    const limit = typeof opts.beforeBlock === "number"
-        ? Math.min(opts.beforeBlock, out.content.length)
-        : out.content.length;
-    for (let b = 0; b < limit; b++) {
-        const block = out.content[b];
-        if (!isObject(block))
-            continue;
-        // Quick reject: skip blocks whose plain text cannot contain the anchor.
-        if (!blockPlainText(block).includes(anchor))
-            continue;
-        // Walk the inline content arrays inside this block, tracking a running
-        // character offset so we can locate the inline array + text run that holds
-        // the END of the anchor's first occurrence.
-        let inserted = false;
-        let offset = 0; // characters of plain text seen so far in this block
-        const anchorEnd = (() => blockPlainText(block).indexOf(anchor) + anchor.length)();
-        // Recurse into inline-bearing containers (paragraph, heading, table cell,
-        // callout child paragraphs, ...). We only split inside an array of inline
-        // nodes (text/inline atoms); the FIRST array whose cumulative range covers
-        // anchorEnd receives the split + marker.
-        const visit = (container) => {
-            if (inserted || !isObject(container) || !Array.isArray(container.content)) {
-                return;
-            }
-            // Skip a forbidden subtree entirely (e.g. footnotesList/footnoteDefinition):
-            // never split into it, but keep `offset` aligned for any sibling text after
-            // it within this block.
-            if (opts.skipSubtreeTypes && opts.skipSubtreeTypes.has(container.type)) {
-                offset += blockPlainText(container).length;
-                return;
-            }
-            const inline = container.content;
-            // Detect whether this array is an inline array (contains text nodes).
-            const hasText = inline.some((n) => isObject(n) && n.type === "text");
-            if (hasText) {
-                // Refuse a textblock whose content spec cannot hold the inserted nodes
-                // (e.g. a codeBlock for an inline atom). Keep `offset` aligned for any
-                // sibling textblocks in this same block, then bail so the search falls
-                // through to the next candidate block.
-                if (opts.forbidBlockTypes && opts.forbidBlockTypes.has(container.type)) {
-                    offset += blockPlainText(container).length;
-                    return;
-                }
-                for (let i = 0; i < inline.length; i++) {
-                    const n = inline[i];
-                    const len = isObject(n) ? blockPlainText(n).length : 0;
-                    const runStart = offset;
-                    const runEnd = offset + len;
-                    // The run that contains the anchor end (anchorEnd lands inside this
-                    // run, i.e. runStart < anchorEnd <= runEnd) is the split point.
-                    if (!inserted &&
-                        isObject(n) &&
-                        n.type === "text" &&
-                        typeof n.text === "string" &&
-                        anchorEnd > runStart &&
-                        anchorEnd <= runEnd) {
-                        const cut = anchorEnd - runStart; // split index within this text run
-                        const before = n.text.slice(0, cut);
-                        const after = n.text.slice(cut);
-                        const marks = Array.isArray(n.marks) ? n.marks : [];
-                        const parts = [];
-                        if (before.length > 0) {
-                            parts.push({ ...n, text: before, marks: [...marks] });
-                        }
-                        // The inserted nodes are caller-decided (a space-padded marker run,
-                        // or a node that hugs the word). They carry no copied marks.
-                        parts.push(...makeMiddle());
-                        if (after.length > 0) {
-                            parts.push({ ...n, text: after, marks: [...marks] });
-                        }
-                        inline.splice(i, 1, ...parts);
-                        inserted = true;
-                        return;
-                    }
-                    offset = runEnd;
-                }
-            }
-            else {
-                // Not an inline array: recurse into children (e.g. callout -> paragraph).
-                for (const child of inline) {
-                    visit(child);
-                    if (inserted)
-                        return;
-                }
-            }
-        };
-        visit(block);
-        if (inserted) {
-            return { doc: out, inserted: true };
-        }
-        // If the block matched in plain text but we could not split (e.g. anchor
-        // lands inside an atom), fall through to the next block rather than failing.
-    }
-    return { doc: out, inserted: false };
-}
-/**
- * In the disclaimer callout, replace a `[1]…[K]` range marker with `[1]…[n]`.
- *
- * Docmost translations use a callout that states the footnote range, e.g.
- * "[1]…[5]". When the number of notes changes, this rewrites the trailing
- * number of any `[1]…[K]` (or `[1]...[K]`, ASCII ellipsis) occurrence found in a
- * callout's text nodes to `[1]…[n]`. Operates on a clone; returns
- * `{ doc, changed }` where `changed` is the number of text nodes rewritten.
- */
-export function setCalloutRange(doc, n) {
-    const out = clone(doc);
-    let changed = 0;
-    // Match "[1]" + (… or ...) + "[<digits>]"; rewrite the last number to n.
-    const rangeRe = /(\[1\]\s*(?:…|\.\.\.)\s*\[)\d+(\])/g;
-    walk(out, (node) => {
-        if (node.type === "callout") {
-            walk(node, (inner) => {
-                if (inner.type === "text" &&
-                    typeof inner.text === "string" &&
-                    rangeRe.test(inner.text)) {
-                    rangeRe.lastIndex = 0;
-                    inner.text = inner.text.replace(rangeRe, `$1${n}$2`);
-                    changed++;
-                }
-                rangeRe.lastIndex = 0;
-            });
-        }
-    });
-    return { doc: out, changed };
-}
-/**
- * Generate a short random id for a new block's `attrs.id`. Docmost uses nanoid;
- * a base36 random string is sufficient here (uniqueness within one document).
- */
-function freshId() {
-    return (Math.random().toString(36).slice(2, 12) +
-        Math.random().toString(36).slice(2, 6));
-}
-/**
- * Wrap inline ProseMirror nodes in a list item:
- *   { type:"listItem", content:[{ type:"paragraph", attrs:{id}, content: inlineNodes }] }
- * with a fresh random block id on the paragraph. The inline nodes are cloned so
- * the result shares no references with the caller's input.
- */
-export function noteItem(inlineNodes) {
-    const content = Array.isArray(inlineNodes) ? clone(inlineNodes) : [];
-    return {
-        type: "listItem",
-        content: [
-            {
-                type: "paragraph",
-                attrs: { id: freshId() },
-                content,
-            },
-        ],
-    };
-}
-/**
- * Wrap inline ProseMirror nodes in a real footnoteDefinition node keyed by id:
- *   { type:"footnoteDefinition", attrs:{id}, content:[{ type:"paragraph", content }] }
- * (mirrors the editor-ext / docmost-schema FootnoteDefinition node).
- *
- * Built on the shared `makeFootnoteDefinition` factory (footnote-authoring.ts);
- * the only extra is a fresh block id on the inner paragraph (Docmost stamps one,
- * and the canonicalizer preserves attrs as-is). Single factory, one place to
- * change the definition shape.
- */
-export function footnoteDefinition(id, inlineNodes) {
-    const node = makeFootnoteDefinition(id, inlineNodes);
-    node.content[0].attrs = { id: freshId() };
-    return node;
-}
-/**
- * Replace every `[N]` body marker and `\u0000FN<i>\u0000` comment placeholder in
- * an inline content array with a real `footnoteReference` node, in reading
- * order. `onMarker` is called for each replaced marker (with the original `[N]`
- * number or the placeholder index) and returns the fresh footnote id to attach
- * to the inserted node. Mutates `inline` in place.
- */
-function replaceMarkersWithReferences(inline, onMarker) {
-    const re = /\[(\d+)\]|\u0000FN(\d+)\u0000/g;
-    for (let i = 0; i < inline.length; i++) {
-        const n = inline[i];
-        if (!isObject(n) || n.type !== "text" || typeof n.text !== "string") {
-            continue;
-        }
-        if (!re.test(n.text))
-            continue;
-        re.lastIndex = 0;
-        const marks = Array.isArray(n.marks) ? n.marks : [];
-        const parts = [];
-        let last = 0;
-        let m;
-        while ((m = re.exec(n.text)) !== null) {
-            if (m.index > last) {
-                parts.push({ ...n, text: n.text.slice(last, m.index), marks: [...marks] });
-            }
-            const oldNum = m[1] != null ? Number(m[1]) : undefined;
-            const phIdx = m[2] != null ? Number(m[2]) : undefined;
-            const fnId = onMarker({ oldNum, phIdx });
-            parts.push({ type: "footnoteReference", attrs: { id: fnId } });
-            last = m.index + m[0].length;
-        }
-        if (last < n.text.length) {
-            parts.push({ ...n, text: n.text.slice(last), marks: [...marks] });
-        }
-        // Drop any zero-length text runs the slicing may have produced.
-        const cleaned = parts.filter((p) => p.type !== "text" || (typeof p.text === "string" && p.text.length > 0));
-        inline.splice(i, 1, ...cleaned);
-        i += cleaned.length - 1;
-    }
-}
-/**
- * Convert a comment's markdown (e.g. `**Lead.** body...`) into inline
- * ProseMirror nodes.
- *
- * A leading `комментарий: ` (case-insensitive) or `N. ` numeric prefix is
- * stripped first. Then a minimal bold-split is applied: a leading
- * `**bold lead**` run becomes a text node with a bold mark, and the remainder
- * becomes a plain text node. This keeps the conversion synchronous (the
- * transform sandbox runs synchronously) and dependency-free; the existing
- * async markdownToProseMirror is intentionally NOT used here.
- */
-export function mdToInlineNodes(markdown) {
-    let md = typeof markdown === "string" ? markdown : "";
-    // Strip a leading "комментарий: " prefix (case-insensitive) or a "N. " prefix.
-    md = md.replace(/^\s*комментарий\s*:\s*/i, "");
-    md = md.replace(/^\s*\d+\.\s+/, "");
-    md = md.trim();
-    if (md === "")
-        return [];
-    const nodes = [];
-    // Leading bold lead: **...** at the very start.
-    const leadMatch = /^\*\*([^*]+)\*\*\s*/.exec(md);
-    if (leadMatch) {
-        const leadText = leadMatch[1];
-        nodes.push({
-            type: "text",
-            text: leadText,
-            marks: [{ type: "bold" }],
-        });
-        const rest = md.slice(leadMatch[0].length);
-        if (rest.length > 0) {
-            // Preserve the separating space that followed the bold lead.
-            const sep = /^\*\*[^*]+\*\*(\s*)/.exec(md);
-            const spacing = sep ? sep[1] : "";
-            nodes.push({ type: "text", text: spacing + rest });
-        }
-        return nodes;
-    }
-    // No bold lead: emit the whole thing as a single plain text node, with any
-    // remaining **bold** spans split out inline.
-    return splitInlineBold(md);
-}
-/**
- * Split a string with inline `**bold**` spans into text nodes, bolding the
- * spans. Used as the no-lead fallback in mdToInlineNodes.
- */
-function splitInlineBold(text) {
-    const nodes = [];
-    const re = /\*\*([^*]+)\*\*/g;
-    let last = 0;
-    let m;
-    while ((m = re.exec(text)) !== null) {
-        if (m.index > last) {
-            nodes.push({ type: "text", text: text.slice(last, m.index) });
-        }
-        nodes.push({ type: "text", text: m[1], marks: [{ type: "bold" }] });
-        last = m.index + m[0].length;
-    }
-    if (last < text.length) {
-        nodes.push({ type: "text", text: text.slice(last) });
-    }
-    return nodes.length > 0 ? nodes : [{ type: "text", text }];
-}
-/**
- * Turn inline comments into numbered footnotes.
- *
- * For each inline comment that carries a `selection`:
- *   1. insert a placeholder marker (a NUL-delimited "\u0000FN<i>\u0000"
- *      sentinel) right after the selection text in the BODY (before the
- *      notes heading);
- *   2. build a note list item from the comment's markdown content.
- *
- * Then RENUMBER every footnote marker in the body by reading order: existing
- * `[N]` markers and the new "\u0000FN<i>\u0000" placeholders are both replaced by a
- * sequential `[seq]`, and the notes orderedList is reordered so each note lines
- * up with its marker's reading-order position. Finally the disclaimer callout
- * range is synced to the new note count.
- *
- * Returns `{ doc, consumed }` where `consumed` lists the ids of comments that
- * were successfully anchored (their selection was found and a placeholder
- * inserted). Operates on a clone of `doc`.
- */
-export function commentsToFootnotes(doc, comments, opts = {}) {
-    let working = clone(doc);
-    const notesHeading = opts.notesHeading ?? "Примечания переводчика";
-    const top = Array.isArray(working.content) ? working.content : [];
-    const notesIdx = top.findIndex((n) => isObject(n) && n.type === "heading" && blockText(n).trim() === notesHeading);
-    if (notesIdx < 0) {
-        throw new Error(`heading "${notesHeading}" not found`);
-    }
-    // The notes orderedList lives at or after the heading.
-    const notesList = top
-        .slice(notesIdx)
-        .find((n) => isObject(n) && n.type === "orderedList");
-    if (!notesList) {
-        throw new Error("notes orderedList not found");
-    }
-    const consumed = [];
-    const noteInlineByPh = new Map();
-    (Array.isArray(comments) ? comments : []).forEach((c, i) => {
-        if (!c || !c.selection)
-            return;
-        // Collision-proof sentinel delimited by NUL control chars, which never occur
-        // in real Docmost prose - so the marker regex cannot mistake any body text
-        // (e.g. "Press F1 for help", model "FN2") for a placeholder. The NUL is
-        // transient: the placeholder is inserted here and replaced by a
-        // footnoteReference node below; it never persists in a returned document.
-        const ph = `\u0000FN${i}\u0000`;
-        // insertMarkerAfter returns a NEW cloned doc; reassign `working`.
-        const r = insertMarkerAfter(working, c.selection.trimEnd(), ph, {
-            beforeBlock: notesIdx,
-        });
-        if (!r.inserted)
-            return;
-        working = r.doc;
-        noteInlineByPh.set(ph, mdToInlineNodes(c.content));
-        consumed.push(c.id);
-    });
-    // Re-resolve references into the (possibly re-cloned) working doc.
-    const top2 = Array.isArray(working.content) ? working.content : [];
-    const notesIdx2 = top2.findIndex((n) => isObject(n) && n.type === "heading" && blockText(n).trim() === notesHeading);
-    const oldListIndex = top2.findIndex((n) => isObject(n) && n.type === "orderedList");
-    const notesList2 = oldListIndex >= 0 ? top2[oldListIndex] : null;
-    if (!notesList2) {
-        throw new Error("notes orderedList not found");
-    }
-    // Inline content of each existing note (listItem -> paragraph -> inline).
-    const oldNoteInline = (Array.isArray(notesList2.content)
-        ? notesList2.content
-        : []).map((item) => {
-        const para = isObject(item) && Array.isArray(item.content)
-            ? item.content.find((c) => isObject(c) && c.type === "paragraph")
-            : null;
-        return para && Array.isArray(para.content) ? para.content : [];
-    });
-    // Walk the body in reading order, turning each "[N]" / placeholder marker into
-    // a real footnoteReference node and collecting its definition inline content.
-    const definitions = [];
-    const disclaimerRangeRe = /(\[1\]\s*(?:…|\.\.\.)\s*\[)\d+(\])/;
-    // Recursively visit inline arrays inside a block (paragraph, heading, callout
-    // child paragraphs, table cells, ...), preserving document reading order.
-    const visitInlineArrays = (container) => {
-        if (!isObject(container) || !Array.isArray(container.content))
-            return;
-        const hasText = container.content.some((n) => isObject(n) && n.type === "text");
-        if (hasText) {
-            replaceMarkersWithReferences(container.content, ({ oldNum, phIdx }) => {
-                const fnId = freshId();
-                if (oldNum != null) {
-                    const inline = oldNoteInline[oldNum - 1];
-                    // Every existing body marker MUST map to a real note. An out-of-range
-                    // marker means the document is internally inconsistent; fail loudly.
-                    if (inline === undefined) {
-                        throw new Error(`footnote [${oldNum}] has no matching note (notes list has ${oldNoteInline.length} items); document is inconsistent`);
-                    }
-                    definitions.push(footnoteDefinition(fnId, inline));
-                }
-                else {
-                    const inline = noteInlineByPh.get(`\u0000FN${phIdx}\u0000`) || [];
-                    definitions.push(footnoteDefinition(fnId, inline));
-                }
-                return fnId;
-            });
-        }
-        else {
-            for (const child of container.content)
-                visitInlineArrays(child);
-        }
-    };
-    const notesBoundary = notesIdx2 >= 0 ? notesIdx2 : oldListIndex;
-    for (let i = 0; i < notesBoundary; i++) {
-        // Skip ONLY the disclaimer callout: its "[1]...[K]" range is NOT a footnote
-        // marker and is synced separately by setCalloutRange.
-        if (isObject(top2[i]) &&
-            top2[i].type === "callout" &&
-            disclaimerRangeRe.test(blockText(top2[i]))) {
-            continue;
-        }
-        visitInlineArrays(top2[i]);
-    }
-    // Replace the old orderedList with a real footnotesList of the collected
-    // definitions (reading order). If there are no definitions, drop the list.
-    if (definitions.length > 0) {
-        top2[oldListIndex] = {
-            type: "footnotesList",
-            content: definitions,
-        };
-    }
-    else {
-        top2.splice(oldListIndex, 1);
-    }
-    // Sync the disclaimer callout range to the new note count.
-    const synced = setCalloutRange(working, definitions.length);
-    return { doc: synced.doc, consumed };
-}
-/**
- * AUTHOR-INLINE footnote insertion. The caller supplies WHERE (anchorText) and
- * WHAT (markdown text); numbering and the bottom list are derived server-side by
- * `canonicalizeFootnotes`. The caller never sees or edits `footnotesList`, never
- * assigns a number, and cannot desync — orphans / out-of-order lists / raw
- * `[^id]` markdown are structurally impossible.
- *
- * Content DEDUP (#3 in the issue): if an existing definition has the SAME
- * normalized content key, its id is REUSED (the new reference points at it: one
- * number, one definition, several references). Otherwise a fresh uuid id is
- * minted and a new definition added. Conservative — only an exact content match
- * merges.
- *
- * Mechanics: the `footnoteReference` node is inserted DIRECTLY at the anchor via
- * the same mark-safe split as `insertMarkerAfter` (the shared
- * `insertNodesAfterAnchor` core), so it hugs the preceding word with no text
- * sentinel round-trip. The whole document is then canonicalized.
- *
- * Operates on a clone of `doc`. When the anchor is not found, returns the input
- * unchanged with `inserted:false`.
- */
-export function insertInlineFootnote(doc, opts) {
-    const inline = mdToInlineNodes(opts.text ?? "");
-    // footnoteContentKey only reads `.content`, so key off the inline array
-    // directly instead of building a throwaway definition node.
-    const key = footnoteContentKey({ content: inline });
-    // Content dedup: reuse an existing definition's id when its key matches.
-    let footnoteId = null;
-    let reused = false;
-    if (key !== "") {
-        walk(doc, (n) => {
-            if (footnoteId == null &&
-                isObject(n) &&
-                n.type === "footnoteDefinition" &&
-                n.attrs &&
-                typeof n.attrs.id === "string" &&
-                n.attrs.id !== "" &&
-                footnoteContentKey(n) === key) {
-                footnoteId = n.attrs.id;
-                reused = true;
-            }
-        });
-    }
-    if (footnoteId == null)
-        footnoteId = generateFootnoteId();
-    // Insert the footnoteReference node directly after the anchor (mark-safe
-    // split); it hugs the preceding word with no leading space. Two guards keep the
-    // inline atom out of the notes section and out of blocks that cannot hold it:
-    //  - beforeBlock bounds the search to the BODY, before the first top-level block
-    //    that IS or CONTAINS (at any depth) a footnotesList/footnoteDefinition — so
-    //    a NESTED list or a bare definition also bounds the search, not just a
-    //    top-level list;
-    //  - skipSubtreeTypes refuses to descend into any footnotesList/footnoteDefinition
-    //    subtree, so a reference is never glued inside an existing definition (which
-    //    the canonicalizer would then drop as an orphan, losing that definition's
-    //    prose); and forbidBlockTypes refuses codeBlocks (an inline atom there is a
-    //    schema-invalid doc; insert_footnote skips validateDocStructure).
-    // When the only anchor match is in such a place, the insert is refused and the
-    // write aborts cleanly (inserted:false) instead of destroying content.
-    const boundaryIdx = Array.isArray(doc?.content)
-        ? doc.content.findIndex((n) => containsFootnoteNotes(n))
-        : -1;
-    const r = insertNodesAfterAnchor(doc, (opts.anchorText ?? "").trimEnd(), () => [{ type: "footnoteReference", attrs: { id: footnoteId } }], {
-        ...(boundaryIdx >= 0 ? { beforeBlock: boundaryIdx } : {}),
-        forbidBlockTypes: INLINE_ATOM_FORBIDDEN_BLOCKS,
-        skipSubtreeTypes: FOOTNOTE_NOTES_SUBTREES,
-    });
-    if (!r.inserted) {
-        return { doc: clone(doc), inserted: false, footnoteId, reused };
-    }
-    let working = r.doc;
-    // Add a NEW definition (canonicalize will order/place it); a reused id needs
-    // no new definition (the existing one is shared).
-    if (!reused) {
-        appendDefinition(working, makeFootnoteDefinition(footnoteId, inline));
-    }
-    // Derive numbering + the single bottom list deterministically.
-    working = canonicalizeFootnotes(working);
-    return { doc: working, inserted: true, footnoteId, reused };
-}
-/**
- * Append a definition node so the canonicalizer can order/place it: into the
- * first existing footnotesList, or a new trailing list when none exists.
- */
-function appendDefinition(doc, defNode) {
-    const existingList = getList(doc, (n) => isObject(n) && n.type === "footnotesList");
-    if (existingList && Array.isArray(existingList.content)) {
-        existingList.content.push(defNode);
-        return;
-    }
-    if (Array.isArray(doc.content)) {
-        doc.content.push({ type: "footnotesList", content: [defNode] });
-    }
-}
diff --git a/packages/mcp/build/lib/tree.js b/packages/mcp/build/lib/tree.js
deleted file mode 100644
index dd8cb39e..00000000
--- a/packages/mcp/build/lib/tree.js
+++ /dev/null
@@ -1,89 +0,0 @@
-/**
- * Pure tree-builder: turn a flat array of sidebar-style page nodes (as produced
- * by `enumerateSpacePages`) into a nested tree.
- *
- * Input: a flat array of nodes. Each node is expected to carry at least
- *   { id, slugId, title, position, parentPageId } (extra fields are ignored).
- *
- * Output: an array of ROOT nodes, each shaped as
- *   { id, slugId, title, children? }
- * where `children` is the array of child nodes (same shape, recursively). The
- * `children` key is OMITTED entirely when a node has no children — consistent
- * with how `filterPage` omits an empty `subpages` array — to keep the payload
- * lean (nesting alone conveys the structure; parentPageId/position/hasChildren
- * are intentionally dropped from the output).
- *
- * Linking rule: a node is attached as a child of `parentPageId` only when that
- * parent id is actually present in the input. Otherwise — including a null /
- * undefined `parentPageId`, or a parent that was capped out of the bounded walk
- * — the node is promoted to a ROOT. So "orphan whose parent is missing" is the
- * defined behavior: it surfaces at the top level rather than disappearing.
- *
- * Ordering rule: the roots array and every `children` array are sorted ascending
- * by the node's `position` string. The comparator is a plain code-unit (byte)
- * comparison — NOT localeCompare — because the server orders sidebar pages by
- * `collate "C"` (byte order), which a raw `<`/`>` compare approximates for the
- * fractional-index ASCII keys (e.g. "a0", "a1"). Nodes with a missing/undefined
- * `position` sort last.
- *
- * Pure: no I/O, no network, deterministic.
- */
-export function buildPageTree(nodes) {
-    // Map id -> output node. Build the lean output shape up front.
-    const byId = new Map();
-    // Preserve the original position string for sorting (kept off the output).
-    const positionById = new Map();
-    for (const node of nodes) {
-        if (!node || typeof node !== "object" || !node.id)
-            continue;
-        // Defensive against duplicate ids: last one wins (overwrites the earlier
-        // entry). `enumerateSpacePages` already dedups, so this is belt-and-braces.
-        byId.set(node.id, {
-            id: node.id,
-            slugId: node.slugId,
-            title: node.title,
-        });
-        positionById.set(node.id, node.position);
-    }
-    // Stable comparator on the position string: code-unit order, missing last.
-    const byPosition = (aId, bId) => {
-        const a = positionById.get(aId);
-        const b = positionById.get(bId);
-        if (a === undefined || a === null)
-            return b === undefined || b === null ? 0 : 1;
-        if (b === undefined || b === null)
-            return -1;
-        if (a < b)
-            return -1;
-        if (a > b)
-            return 1;
-        return 0;
-    };
-    const roots = [];
-    const childrenIdsByParent = new Map();
-    for (const node of nodes) {
-        if (!node || typeof node !== "object" || !node.id)
-            continue;
-        const parentId = node.parentPageId;
-        // Child only when the parent is actually present in the input; otherwise
-        // (null/undefined parent, or parent capped out of the walk) -> root.
-        if (parentId && byId.has(parentId)) {
-            const list = childrenIdsByParent.get(parentId) ?? [];
-            list.push(node.id);
-            childrenIdsByParent.set(parentId, list);
-        }
-        else {
-            roots.push(node.id);
-        }
-    }
-    // Attach sorted children arrays to each parent, omitting empty ones.
-    for (const [parentId, childIds] of childrenIdsByParent) {
-        const parent = byId.get(parentId);
-        if (!parent)
-            continue;
-        childIds.sort(byPosition);
-        parent.children = childIds.map((id) => byId.get(id));
-    }
-    roots.sort(byPosition);
-    return roots.map((id) => byId.get(id));
-}
diff --git a/packages/mcp/build/stdio.js b/packages/mcp/build/stdio.js
deleted file mode 100755
index 55f9eccb..00000000
--- a/packages/mcp/build/stdio.js
+++ /dev/null
@@ -1,40 +0,0 @@
-#!/usr/bin/env node
-import { StdioServerTransport } from "@modelcontextprotocol/sdk/server/stdio.js";
-import { createDocmostMcpServer } from "./index.js";
-// Standalone stdio entrypoint. This restores the original behavior of the
-// package when run as a CLI (`docmost-mcp`): it reads credentials from the
-// environment and serves the MCP protocol over stdin/stdout. The factory in
-// index.ts stays side-effect-free; all the process/transport lifecycle lives
-// here.
-const API_URL = process.env.DOCMOST_API_URL;
-const EMAIL = process.env.DOCMOST_EMAIL;
-const PASSWORD = process.env.DOCMOST_PASSWORD;
-if (!API_URL || !EMAIL || !PASSWORD) {
-    console.error("Error: DOCMOST_API_URL, DOCMOST_EMAIL, and DOCMOST_PASSWORD environment variables are required.");
-    process.exit(1);
-}
-async function run() {
-    // Global safety nets so a stray rejection/exception cannot silently kill
-    // the stdio server. Per-tool errors still flow through the SDK and are not
-    // affected by these handlers; these only catch errors raised OUTSIDE a tool
-    // call (e.g. a transient ws/collab socket "error" event). Such errors must
-    // NOT tear down the whole stdio server, so we log only and keep running.
-    // Genuine startup failures are still fatal via run().catch(...) below.
-    process.on("unhandledRejection", (reason) => {
-        console.error("Unhandled promise rejection:", reason);
-    });
-    process.on("uncaughtException", (error) => {
-        console.error("Uncaught exception:", error);
-    });
-    const server = createDocmostMcpServer({
-        apiUrl: API_URL,
-        email: EMAIL,
-        password: PASSWORD,
-    });
-    const transport = new StdioServerTransport();
-    await server.connect(transport);
-}
-run().catch((error) => {
-    console.error("Fatal error running server:", error);
-    process.exit(1);
-});
diff --git a/packages/mcp/build/tool-specs.js b/packages/mcp/build/tool-specs.js
deleted file mode 100644
index 33319e18..00000000
--- a/packages/mcp/build/tool-specs.js
+++ /dev/null
@@ -1,371 +0,0 @@
-// Zod-agnostic shared tool-spec registry consumed by BOTH the zod-v3 MCP server
-// (packages/mcp/src/index.ts) and the zod-v4 in-app AI-SDK service
-// (apps/server/src/core/ai-chat/tools/ai-chat-tools.service.ts). Intentionally
-// imports NO zod: each consumer passes its OWN zod namespace into buildShape,
-// because the two packages are on different zod majors (v3 here, v4 in the
-// server) and a zod schema object built with one major cannot be reused by the
-// other. The builders below only touch z.string()/.min()/.optional()/.describe(),
-// z.array() and z.object() — API identical across v3 and v4 — so a single
-// builder works with either namespace.
-//
-// Only tools whose snake_case/camelCase name, input schema AND model-facing
-// description are genuinely identical across both layers live here. Tools that
-// diverge on purpose (security guardrails, tuned UX, "Reversible" framing on
-// some write tools, different limits, hybrid-RRF search, etc.) stay defined
-// per-layer and are NOT represented here.
-//
-// MAINTENANCE RULE: adding, renaming, or removing a spec here (or an inline
-// registerTool in index.ts) REQUIRES updating SERVER_INSTRUCTIONS in
-// packages/mcp/src/index.ts — the intent-routing guide MCP clients receive on
-// initialize. Enforced by test/unit/server-instructions.test.mjs.
-export const SHARED_TOOL_SPECS = {
-    // --- no-argument read tools ---
-    getWorkspace: {
-        mcpName: 'get_workspace',
-        inAppKey: 'getWorkspace',
-        description: 'Fetch metadata about the current workspace (name, settings).',
-    },
-    listSpaces: {
-        mcpName: 'list_spaces',
-        inAppKey: 'listSpaces',
-        description: 'List the spaces the current user can access. Returns the array of ' +
-            'spaces (id, name, slug, ...).',
-    },
-    listShares: {
-        mcpName: 'list_shares',
-        inAppKey: 'listShares',
-        description: 'List all public shares in the workspace with page titles and public URLs.',
-    },
-    // --- single-pageId read tools ---
-    getPageJson: {
-        mcpName: 'get_page_json',
-        inAppKey: 'getPageJson',
-        description: 'Get page details with the raw ProseMirror JSON content (lossless: ' +
-            'includes block ids, callouts, tables, link/image attributes) plus the ' +
-            'slugId used in URLs. Use the block ids it returns to make precise ' +
-            'structural edits or surgical text edits without resending the page.',
-        buildShape: (z) => ({
-            pageId: z.string().min(1),
-        }),
-    },
-    getOutline: {
-        mcpName: 'get_outline',
-        inAppKey: 'getOutline',
-        description: "Return a COMPACT outline of a page's top-level blocks ({index, type, " +
-            'id, level, firstText}; tables add rows/cols/header; lists add item ' +
-            'count) WITHOUT the full document body. Use it to locate sections/tables ' +
-            'and grab block ids cheaply before fetching, patching or inserting ' +
-            'individual blocks.',
-        buildShape: (z) => ({
-            pageId: z.string().min(1),
-        }),
-    },
-    // --- two-id read tool ---
-    getNode: {
-        mcpName: 'get_node',
-        inAppKey: 'getNode',
-        description: "Fetch a single node's full ProseMirror subtree (lossless) without " +
-            'pulling the whole document. `nodeId` is a block id from the page ' +
-            'outline or page-JSON view (works for headings/paragraphs/callouts/images), OR ' +
-            '`#<index>` to fetch a top-level block by its outline index — use the ' +
-            '`#<index>` form for tables/rows/cells, which carry no id.',
-        buildShape: (z) => ({
-            pageId: z.string().min(1),
-            nodeId: z.string().min(1),
-        }),
-    },
-    // --- in-page occurrence search (client-side, over ProseMirror plain text) ---
-    searchInPage: {
-        mcpName: 'search_in_page',
-        inAppKey: 'searchInPage',
-        description: 'Find every occurrence of a string (or regex) INSIDE one page and get ' +
-            'WHERE each is — instead of pulling blocks one-by-one with get_node. ' +
-            'Searches the plain text of each text block/cell (marks glued, so a match ' +
-            'survives bold/italic/link splits; comment anchors do not interfere). ' +
-            'Returns { total, truncated, matches:[{ nodeId, blockIndex, type, before, ' +
-            'match, after }] }: `nodeId` is the block id (or "#<index>" for ' +
-            'table/cell content) — pass it to get_node/patch_node (the "#<index>" ' +
-            'form resolves with get_node but NOT patch_node, which only accepts a real ' +
-            'block id). To anchor a comment, do NOT pass nodeId to create_comment (it ' +
-            'has no nodeId param); build a UNIQUE text selection from before+match+' +
-            'after and pass it as create_comment\'s `selection`. `blockIndex` is the ' +
-            'get_outline index; `before`/`after` give ~40 chars of context to build ' +
-            'that unique selection. `total` counts all ' +
-            'hits and `truncated` is true when more than `limit` were found (nothing ' +
-            'is silently dropped). Default is a literal, case-INSENSITIVE substring; ' +
-            'set regex:true for an RE2 regular expression (linear-time, ReDoS-safe: ' +
-            'char classes, word boundaries, anchors and quantifiers work; lookaround ' +
-            '(?=…)/(?<=…) and backreferences \\1 are NOT supported) and ' +
-            'caseSensitive:true to match case. Ideal for systematic ' +
-            'editorial sweeps (unquoted "ё", straight quotes, "т.е.", stray units). An ' +
-            'invalid regex or an empty query returns a clear error to fix.',
-        buildShape: (z) => ({
-            pageId: z.string().min(1).describe('ID of the page to search'),
-            query: z
-                .string()
-                .min(1)
-                .describe('The text to find (a literal substring, or a regex when regex:true)'),
-            regex: z
-                .boolean()
-                .optional()
-                .describe('Treat query as an RE2 regular expression — linear-time, ReDoS-safe; ' +
-                'no lookaround or backreferences (default false).'),
-            caseSensitive: z
-                .boolean()
-                .optional()
-                .describe('Case-sensitive matching (default false).'),
-            limit: z
-                .number()
-                .int()
-                .min(1)
-                .max(200)
-                .optional()
-                .describe('Max matches to RETURN (default 50, max 200); total is always reported.'),
-        }),
-    },
-    // --- node delete ---
-    deleteNode: {
-        mcpName: 'delete_node',
-        inAppKey: 'deleteNode',
-        description: 'Remove a single block by its attrs.id (from the page outline or ' +
-            'page-JSON view) WITHOUT resending the whole document.',
-        buildShape: (z) => ({
-            pageId: z.string().min(1),
-            nodeId: z.string().min(1),
-        }),
-    },
-    // --- single-block structural write (patch / insert) ---
-    //
-    // CANONICAL description merges both layers: the MCP copy's "WITHOUT resending
-    // the whole document" + "cheaper/safer than a full-document replace" guidance
-    // AND the in-app copy's "keeps the same node id" + "Reversible via page
-    // history" framing — nothing either side conveyed is dropped. Sibling tools are
-    // named in transport-neutral prose ("the page-JSON view", "a full-document
-    // replace") to match the rest of the registry, since the two layers expose
-    // those siblings under different (snake_case vs camelCase) identifiers.
-    patchNode: {
-        mcpName: 'patch_node',
-        inAppKey: 'patchNode',
-        description: 'Replace a single content block identified by its attrs.id with a new ' +
-            'ProseMirror node, WITHOUT resending the whole document; the replacement ' +
-            'keeps the same node id. Get the block id from the page outline (cheap) ' +
-            'or the page-JSON view, then ' +
-            'pass a ProseMirror node to put in its place. Example node: a paragraph ' +
-            '{"type":"paragraph","content":[{"type":"text","text":"Hello"}]} or a ' +
-            'heading {"type":"heading","attrs":{"level":2},"content":' +
-            '[{"type":"text","text":"Title"}]}. Bold is a mark: ' +
-            '{"type":"text","text":"x","marks":[{"type":"bold"}]}. The node may be a ' +
-            'JSON object or a JSON string (both accepted). Cheaper and safer than ' +
-            'replacing the whole document for one-block structural edits. Reversible: ' +
-            'the previous version is kept in page history.',
-        buildShape: (z) => ({
-            pageId: z.string().min(1).describe('ID of the page containing the block'),
-            nodeId: z
-                .string()
-                .min(1)
-                .describe('attrs.id of the block to replace (from the page outline or ' +
-                'page-JSON view)'),
-            node: z
-                .any()
-                .describe('ProseMirror node to put in place of the node with this id, e.g. ' +
-                '{"type":"paragraph","content":[{"type":"text","text":"Hello"}]}. ' +
-                'JSON object or JSON string both accepted.'),
-        }),
-    },
-    insertNode: {
-        mcpName: 'insert_node',
-        inAppKey: 'insertNode',
-        description: 'Insert a block before/after another block (by attrs.id or anchor text) ' +
-            'or append it at the end (top level). For before/after you MUST provide ' +
-            'EXACTLY ONE of anchorNodeId or anchorText. Get anchor block ids from the ' +
-            'page outline or the page-JSON view. Avoids resending the whole document. ' +
-            'Can also insert ' +
-            'table structure: to add a tableRow, pass a tableRow node with position ' +
-            'before/after and anchor INSIDE the target table — anchorNodeId of any ' +
-            'block/cell in it, or anchorText matching the table; to add a ' +
-            'tableCell/tableHeader, use anchorNodeId of a block inside the target row ' +
-            '(anchorText only resolves top-level blocks, so it cannot target a row). ' +
-            "`anchorText` is matched against the block's literal rendered plain text " +
-            '(no markdown); markdown/emoji are tolerated as a fallback; prefer plain ' +
-            'text or anchorNodeId. Note: append is top-level only and rejects ' +
-            'structural table nodes. Example node: a paragraph ' +
-            '{"type":"paragraph","content":[{"type":"text","text":"Hello"}]} or a ' +
-            'heading {"type":"heading","attrs":{"level":2},"content":' +
-            '[{"type":"text","text":"Title"}]}. Bold is a mark: ' +
-            '{"type":"text","text":"x","marks":[{"type":"bold"}]}. The node may be a ' +
-            'JSON object or a JSON string (both accepted). Reversible via page history.',
-        buildShape: (z) => ({
-            pageId: z.string().min(1),
-            node: z
-                .any()
-                .describe('ProseMirror node to insert, e.g. ' +
-                '{"type":"paragraph","content":[{"type":"text","text":"Hello"}]}. ' +
-                'JSON object or JSON string both accepted.'),
-            position: z
-                .enum(['before', 'after', 'append'])
-                .describe('Where to insert relative to the anchor.'),
-            anchorNodeId: z
-                .string()
-                .optional()
-                .describe('Anchor block id (for before/after).'),
-            anchorText: z
-                .string()
-                .optional()
-                .describe("Anchor text fragment (for before/after), matched against the " +
-                "block's literal rendered plain text (no markdown). Markdown/emoji " +
-                'are tolerated as a fallback; prefer plain text or anchorNodeId.'),
-        }),
-    },
-    // --- share management ---
-    unsharePage: {
-        mcpName: 'unshare_page',
-        inAppKey: 'unsharePage',
-        description: 'Remove the public share of a page (revokes the public URL).',
-        buildShape: (z) => ({
-            pageId: z.string().min(1).describe('ID of the page to unshare'),
-        }),
-    },
-    // --- version history ---
-    diffPageVersions: {
-        mcpName: 'diff_page_versions',
-        inAppKey: 'diffPageVersions',
-        description: 'Diff two versions of a page and return a Docmost-equivalent change set ' +
-            '(inserted/deleted text, integrity counts for images/links/tables/' +
-            'callouts/footnote markers, and a human-readable markdown summary). ' +
-            "`from`/`to` each accept a historyId, or null/'current' for the page's " +
-            'current content (defaults: from=current, to=current — pass a historyId ' +
-            'from the page-history list to compare against the live page).',
-        buildShape: (z) => ({
-            pageId: z.string().min(1),
-            from: z
-                .string()
-                .optional()
-                .describe("historyId, or 'current'/omit for current content"),
-            to: z
-                .string()
-                .optional()
-                .describe("historyId, or 'current'/omit for current content"),
-        }),
-    },
-    listPageHistory: {
-        mcpName: 'list_page_history',
-        inAppKey: 'listPageHistory',
-        description: "List a page's saved versions (Docmost auto-snapshots on every save), " +
-            'newest first, cursor-paginated. Returns { items, nextCursor }; each ' +
-            "item's id is the historyId to pass to the page diff or restore tools.",
-        buildShape: (z) => ({
-            pageId: z.string().min(1),
-            cursor: z
-                .string()
-                .optional()
-                .describe('Pagination cursor from a previous nextCursor'),
-        }),
-    },
-    restorePageVersion: {
-        mcpName: 'restore_page_version',
-        inAppKey: 'restorePageVersion',
-        description: 'Restore a page to a saved version: writes that version\'s content back ' +
-            'as the page\'s current content (Docmost has no restore endpoint, so ' +
-            'this creates a NEW history snapshot — the restore is itself revertible). ' +
-            'Get the historyId from the page-history list.',
-        buildShape: (z) => ({
-            historyId: z.string().min(1),
-        }),
-    },
-    // --- markdown round-trip ---
-    importPageMarkdown: {
-        mcpName: 'import_page_markdown',
-        inAppKey: 'importPageMarkdown',
-        description: "Replace a page's content from a self-contained Docmost-flavoured " +
-            'Markdown file produced by the page-Markdown export tool. Restores comment ' +
-            'highlight anchors and diagrams from their inline HTML. NOTE: comment ' +
-            'thread records are NOT created/updated/deleted on the server by this ' +
-            'tool — only the page body + inline comment marks are written; manage ' +
-            'comment threads via the comment tools/UI.',
-        buildShape: (z) => ({
-            pageId: z.string().min(1),
-            markdown: z.string().min(1),
-        }),
-    },
-    // --- server-side content copy ---
-    copyPageContent: {
-        mcpName: 'copy_page_content',
-        inAppKey: 'copyPageContent',
-        description: "Replace targetPageId's content with a copy of sourcePageId's content, " +
-            'entirely server-side — the document is NOT sent through the model. The ' +
-            'target keeps its own title and slug; only its body is replaced. Ideal ' +
-            "for 'make page A's content equal to B' or 'replace A with B but keep A's URL'.",
-        buildShape: (z) => ({
-            sourcePageId: z.string().min(1).describe('Page to copy content FROM'),
-            targetPageId: z
-                .string()
-                .min(1)
-                .describe('Page whose content is REPLACED (title/slug kept)'),
-        }),
-    },
-    // --- surgical text edit (folds in the documented drift-bug fix) ---
-    //
-    // CANONICAL description is the CORRECTED in-app wording: a formatting-only
-    // change is REFUSED into failed[] (not silently stripped-and-retried). The
-    // stale MCP claim that "Markdown wrappers are tolerated via a strip-and-retry
-    // fallback" is intentionally absent here.
-    editPageText: {
-        mcpName: 'edit_page_text',
-        inAppKey: 'editPageText',
-        description: "Surgical find/replace inside a page's text, preserving all block " +
-            'ids and marks. A find MAY cross bold/italic/link boundaries; the ' +
-            'replacement inherits marks from the unchanged common prefix/suffix ' +
-            '(so editing plain text next to a bold word keeps it bold, and ' +
-            'editing inside a bold word keeps the new text bold). Each find must ' +
-            'match exactly once unless replaceAll is set. The batch applies what ' +
-            'it can and returns applied[] + failed[] plus a verify change-report ' +
-            '(the text/marks/structure that ACTUALLY changed — read it to confirm ' +
-            'your edit landed; do not assume success); a fully-unmatched batch ' +
-            'writes nothing and errors. find and replace are LITERAL text, not ' +
-            'markdown. This tool edits plain text ONLY and CANNOT add or remove ' +
-            'formatting marks: a formatting change — find/replace that differ only ' +
-            'in markdown markers (e.g. find:"~~x~~", replace:"x"), or a replace ' +
-            'containing **bold**/~~strike~~/`code` wrappers — is REFUSED into ' +
-            'failed[]. To change bold/italic/strike/code/link, read the block as ' +
-            'page JSON and use a structural node patch/update to set its marks. ' +
-            'Examples: edits:[{find:"teh",replace:"the"}]; edits:[{find:"Hello ' +
-            'world",replace:"Hello there"}] (crosses a bold boundary).',
-        buildShape: (z) => ({
-            pageId: z.string().describe('ID of the page to edit'),
-            edits: z
-                .array(z.object({
-                find: z.string().describe('Exact text to find'),
-                replace: z.string().describe('Replacement text (may be empty)'),
-                replaceAll: z
-                    .boolean()
-                    .optional()
-                    .describe('Replace every occurrence (default: must match once)'),
-            }))
-                .min(1)
-                .describe('List of find/replace operations, applied in order'),
-        }),
-    },
-    // --- hand a large page to an external consumer without bloating context ---
-    stashPage: {
-        mcpName: 'stash_page',
-        inAppKey: 'stashPage',
-        description: 'Serialize a whole page (the full ProseMirror JSON, as get_page_json ' +
-            'returns) into an ephemeral in-memory blob and return ONLY a short ' +
-            'anonymous URL to it — the body NEVER enters the model context, so this ' +
-            'is the way to hand a large page (or its images) to an external consumer ' +
-            'without truncation. Every internal file/image attachment is mirrored ' +
-            'into the same sandbox and its src rewritten to a sandbox URL, so the ' +
-            'consumer can fetch the images anonymously too; external http(s) images ' +
-            'are left untouched. Returns { uri, size, sha256, images:{mirrored, ' +
-            'failed} }. Integrity: the blob is served with ETag = its sha256, so a ' +
-            'truncated/corrupted fetch is detectable. Blobs are RAM-only: they expire ' +
-            'after a short TTL (~1h) and are cleared on restart — consume the URL ' +
-            'within the TTL and one uptime, or re-stash. A blob is bound to the ' +
-            'server instance that created it: in a multi-replica deployment without ' +
-            'sticky sessions a blob stored on one instance is not retrievable via the ' +
-            'sandbox URL on another (it 404s like an expired one).',
-        buildShape: (z) => ({
-            pageId: z.string().min(1),
-        }),
-    },
-};
diff --git a/packages/mcp/package.json b/packages/mcp/package.json
index 9ca5b471..b19b5eca 100644
--- a/packages/mcp/package.json
+++ b/packages/mcp/package.json
@@ -32,6 +32,7 @@
   "author": "Moritz Krause",
   "license": "MIT",
   "dependencies": {
+    "@docmost/prosemirror-markdown": "workspace:*",
     "@fellow/prosemirror-recreate-transform": "^1.2.3",
     "@hocuspocus/provider": "^3.4.4",
     "@hocuspocus/transformer": "^3.4.4",
diff --git a/packages/mcp/src/client.ts b/packages/mcp/src/client.ts
index 7c6aef75..1ddc3432 100644
--- a/packages/mcp/src/client.ts
+++ b/packages/mcp/src/client.ts
@@ -808,8 +808,14 @@ export class DocmostClient {
     await this.ensureAuthenticated();
     const resultData = await this.getPageRaw(pageId);
 
+    // Agent read: hide resolved-comment anchors so the agent sees only active
+    // discussions. Active anchors are kept. (The lossless export_page_markdown
+    // round-trip deliberately does NOT pass this flag — resolved anchors there
+    // must be preserved.)
     let content = resultData.content
-      ? convertProseMirrorToMarkdown(resultData.content)
+      ? convertProseMirrorToMarkdown(resultData.content, {
+          dropResolvedCommentAnchors: true,
+        })
       : "";
 
     // Always fetch subpages to provide context to the agent
@@ -1798,7 +1804,10 @@ export class DocmostClient {
     const body = page.content ? convertProseMirrorToMarkdown(page.content) : "";
     let comments: any[] = [];
     try {
-      comments = await this.listComments(pageId);
+      // Lossless export: include RESOLVED threads so the export -> import
+      // round-trip preserves every comment. This is exactly why listComments
+      // filters by default and takes an `includeResolved` opt-in (default false).
+      comments = (await this.listComments(pageId, true)).items;
     } catch (e) {
       // A comments fetch failure must not lose the body; export with [] and let
       // the caller see the (empty) comments block. Log under DEBUG only.
@@ -2367,8 +2376,21 @@ export class DocmostClient {
     }
   }
 
-  /** List all comments on a page (cursor-paginated), content as markdown. */
-  async listComments(pageId: string) {
+  /**
+   * List comments on a page (cursor-paginated), content as markdown.
+   *
+   * DEFAULT (`includeResolved = false`) hides RESOLVED THREADS WHOLESALE so the
+   * agent sees only active discussions: a top-level comment with `resolvedAt`
+   * set AND every reply under it (a reply of a closed thread is part of the
+   * closed thread) are dropped from `items`. `resolvedThreadsHidden` reports how
+   * many resolved top-level threads were hidden so the agent can re-query with
+   * `includeResolved: true` to see everything. Active threads always stay.
+   *
+   * Returns `{ items, resolvedThreadsHidden }` (NOT a bare array) — callers that
+   * need the full feed (lossless export, transformPage, checkNewComments) pass
+   * `true` as the second argument (`includeResolved`) and read `.items`.
+   */
+  async listComments(pageId: string, includeResolved = false) {
     await this.ensureAuthenticated();
     let allComments: any[] = [];
     let cursor: string | null = null;
@@ -2384,7 +2406,7 @@ export class DocmostClient {
       cursor = data.meta?.nextCursor || null;
     } while (cursor);
 
-    return allComments.map((comment: any) => {
+    const mapped = allComments.map((comment: any) => {
       const markdown = comment.content
         ? convertProseMirrorToMarkdown(
             this.parseCommentContent(comment.content),
@@ -2392,6 +2414,31 @@ export class DocmostClient {
         : "";
       return filterComment(comment, markdown);
     });
+
+    if (includeResolved) {
+      return { items: mapped, resolvedThreadsHidden: 0 };
+    }
+
+    // Ids of RESOLVED top-level threads (a top-level comment has no
+    // parentCommentId). A whole thread is hidden when its root is resolved.
+    const resolvedRootIds = new Set(
+      mapped
+        .filter((c) => !c.parentCommentId && c.resolvedAt != null)
+        .map((c) => c.id),
+    );
+
+    const items = mapped.filter((c) => {
+      // Hide the resolved root itself and every reply anchored to it. A reply's
+      // own resolvedAt is irrelevant — its membership follows the parent thread.
+      // ASSUMPTION: Docmost's comment model is FLAT — a reply's parentCommentId
+      // always points at the thread ROOT (no reply-of-reply nesting), so a single
+      // level of parent lookup covers a whole thread. If nested replies are ever
+      // introduced, a deep reply of a resolved thread would need a root-walk here.
+      if (!c.parentCommentId) return !resolvedRootIds.has(c.id);
+      return !resolvedRootIds.has(c.parentCommentId);
+    });
+
+    return { items, resolvedThreadsHidden: resolvedRootIds.size };
   }
 
   async getComment(commentId: string) {
@@ -2766,7 +2813,9 @@ export class DocmostClient {
     const results: any[] = [];
     for (const page of pagesInScope) {
       try {
-        const comments = await this.listComments(page.id);
+        // Full feed (incl. resolved): a "new comments since" scan reports all
+        // recent activity; the active-only filter is scoped to list_comments.
+        const comments = (await this.listComments(page.id, true)).items;
         const newComments = comments.filter(
           (c: any) => new Date(c.createdAt) > sinceDate,
         );
@@ -3512,7 +3561,9 @@ export class DocmostClient {
     const deleteComments = opts.deleteComments ?? false;
 
     await this.ensureAuthenticated();
-    const comments = await this.listComments(pageId);
+    // Full feed (incl. resolved): a page transform (e.g. comments -> footnotes)
+    // must operate on every comment, so it opts into the unfiltered feed.
+    const comments = (await this.listComments(pageId, true)).items;
 
     // ctx handed to the sandbox. consume() records ids; helpers are the pure
     // transform primitives. log is captured from console.log inside the sandbox.
diff --git a/packages/mcp/src/index.ts b/packages/mcp/src/index.ts
index db6c9274..fe6d8ffd 100644
--- a/packages/mcp/src/index.ts
+++ b/packages/mcp/src/index.ts
@@ -725,15 +725,24 @@ server.registerTool(
   "list_comments",
   {
     description:
-      "List ALL comments on a page in one call (pagination is handled " +
-      "internally), including RESOLVED threads — filter by resolvedAt when you " +
-      "need only open ones. Content is returned as Markdown.",
+      "List comments on a page in one call (pagination is handled " +
+      "internally). By DEFAULT only ACTIVE threads are returned; resolved " +
+      "threads (a resolved top-level comment and all its replies) are hidden " +
+      "and their count reported as `resolvedThreadsHidden` so you can re-query " +
+      "with `includeResolved: true` to see everything. Returns " +
+      "`{ items, resolvedThreadsHidden }`. Content is returned as Markdown.",
     inputSchema: {
       pageId: z.string().describe("ID of the page"),
+      includeResolved: z
+        .boolean()
+        .optional()
+        .describe(
+          "default only active threads; true — include resolved",
+        ),
     },
   },
-  async ({ pageId }) => {
-    const comments = await docmostClient.listComments(pageId);
+  async ({ pageId, includeResolved }) => {
+    const comments = await docmostClient.listComments(pageId, includeResolved);
     return jsonContent(comments);
   },
 );
diff --git a/packages/mcp/src/lib/collaboration.ts b/packages/mcp/src/lib/collaboration.ts
index c8b1cf40..c14afbf8 100644
--- a/packages/mcp/src/lib/collaboration.ts
+++ b/packages/mcp/src/lib/collaboration.ts
@@ -2,18 +2,24 @@ import { HocuspocusProvider } from "@hocuspocus/provider";
 import { TiptapTransformer } from "@hocuspocus/transformer";
 import * as Y from "yjs";
 import WebSocket from "ws";
-import { marked } from "marked";
-import { generateJSON } from "@tiptap/html";
 import { Node as PMNode } from "@tiptap/pm/model";
 import { updateYFragment } from "y-prosemirror";
 import { JSDOM } from "jsdom";
+// #293 STEP 5: the pure markdown -> ProseMirror import path is now owned by the
+// shared package (canonical `^[…]` footnotes, `$…$` math, `==` highlight, the
+// media-family md forms, comment-directive attrs, callouts and task lists all
+// handled there). MCP consumes it directly instead of maintaining its own
+// drifted marked pipeline; only the collab/yjs write glue and the footnote
+// canonicalization wrapper stay mcp-side.
+import { markdownToProseMirror } from "@docmost/prosemirror-markdown";
 import { docmostExtensions, docmostSchema } from "./docmost-schema.js";
 import { withPageLock } from "./page-lock.js";
 import { sanitizeForYjs, findUnstorableAttr } from "./node-ops.js";
-import { lexFootnoteLines } from "./footnote-lex.js";
 import { canonicalizeFootnotes } from "./footnote-canonicalize.js";
 import { summarizeChange, VerifyReport } from "./diff.js";
 
+export { markdownToProseMirror };
+
 /**
  * Build the descriptive error for an opaque Yjs encode failure ("Unexpected
  * content type"), shared by both encode paths (`buildYDoc` -> `toYdoc` and
@@ -51,382 +57,27 @@ global.WebSocket = WebSocket;
 // global.navigator = dom.window.navigator;
 
 /**
- * Hard ceiling above which we skip callout preprocessing entirely. The linear
- * scanner below has no quadratic blow-up, but we still cap input defensively so
- * a pathological multi-megabyte payload cannot tie up the event loop; in that
- * case the markdown is passed through verbatim (callouts are simply not
- * detected) rather than risking a slow scan.
- */
-const MAX_CALLOUT_PREPROCESS_BYTES = 4 * 1024 * 1024; // 4 MB
-
-/** Matches an opening callout fence: `:::type` (type captured, lower-cased). */
-const CALLOUT_OPEN_RE = /^:::\s*(\w+)\s*$/;
-/** Matches a bare closing callout fence: `:::`. */
-const CALLOUT_CLOSE_RE = /^:::\s*$/;
-/** Matches the start/end of a code fence (``` or ~~~), capturing the marker. */
-const CODE_FENCE_RE = /^(\s*)(`{3,}|~{3,})/;
-
-/**
- * Pre-process Docmost-flavoured markdown: convert `:::type ... :::`
- * callout blocks (the syntax our markdown export produces) into HTML
- * divs that the callout extension parses. The inner content is rendered
- * through marked as regular markdown.
+ * Page-write variant of the package's `markdownToProseMirror`: imports markdown
+ * then re-runs mcp's footnote canonicalizer over the result.
  *
- * Implemented as a single linear pass over the lines (no quadratic regex
- * rescan). It:
- *   - tracks fenced code regions (```...``` and ~~~...~~~) and never treats a
- *     `:::` line that lives inside a code fence as a callout delimiter, so a
- *     callout body that itself contains a fenced code block with a `:::` line is
- *     no longer corrupted;
- *   - matches an opening `:::type` line with the next CLOSING `:::` at the SAME
- *     nesting level, supporting NESTED callouts via a depth counter (an inner
- *     `:::type` opens a deeper level and consumes a matching `:::`);
- *   - emits the same `<div data-type="callout" data-callout-type="TYPE">` output
- *     (inner rendered through marked) as the previous regex implementation.
- */
-async function preprocessCallouts(markdown: string): Promise<string> {
-  // Defensive cap: skip preprocessing for pathologically large inputs.
-  if (markdown.length > MAX_CALLOUT_PREPROCESS_BYTES) {
-    return markdown;
-  }
-
-  // Recursively transform a slice of lines, converting top-level callouts in
-  // that slice into <div> blocks and rendering their inner content (which may
-  // itself contain nested callouts) through this same function.
-  const transform = async (lines: string[]): Promise<string> => {
-    const out: string[] = [];
-    let inCodeFence = false;
-    let codeFenceMarker = ""; // the exact run of backticks/tildes that opened it
-    let i = 0;
-
-    while (i < lines.length) {
-      const line = lines[i];
-
-      // Inside a code fence, only its matching closing fence is significant;
-      // everything else (including `:::` lines) is copied through verbatim.
-      if (inCodeFence) {
-        out.push(line);
-        const fence = line.match(CODE_FENCE_RE);
-        if (fence && fence[2].startsWith(codeFenceMarker[0]) &&
-            fence[2].length >= codeFenceMarker.length) {
-          inCodeFence = false;
-          codeFenceMarker = "";
-        }
-        i++;
-        continue;
-      }
-
-      // A code fence opening outside any callout body: enter code-fence mode.
-      const fenceOpen = line.match(CODE_FENCE_RE);
-      if (fenceOpen) {
-        inCodeFence = true;
-        codeFenceMarker = fenceOpen[2];
-        out.push(line);
-        i++;
-        continue;
-      }
-
-      // An opening callout fence: scan forward (with code-fence and nested
-      // callout awareness) for its matching closing `:::` at the same level.
-      const open = line.match(CALLOUT_OPEN_RE);
-      if (open) {
-        const type = open[1].toLowerCase();
-        const bodyLines: string[] = [];
-        let depth = 1;
-        let innerInCodeFence = false;
-        let innerCodeFenceMarker = "";
-        let j = i + 1;
-        for (; j < lines.length; j++) {
-          const bl = lines[j];
-          if (innerInCodeFence) {
-            const f = bl.match(CODE_FENCE_RE);
-            if (f && f[2].startsWith(innerCodeFenceMarker[0]) &&
-                f[2].length >= innerCodeFenceMarker.length) {
-              innerInCodeFence = false;
-              innerCodeFenceMarker = "";
-            }
-            bodyLines.push(bl);
-            continue;
-          }
-          const innerFence = bl.match(CODE_FENCE_RE);
-          if (innerFence) {
-            innerInCodeFence = true;
-            innerCodeFenceMarker = innerFence[2];
-            bodyLines.push(bl);
-            continue;
-          }
-          if (CALLOUT_OPEN_RE.test(bl)) {
-            depth++;
-            bodyLines.push(bl);
-            continue;
-          }
-          if (CALLOUT_CLOSE_RE.test(bl)) {
-            depth--;
-            if (depth === 0) break; // matching close for THIS callout
-            bodyLines.push(bl);
-            continue;
-          }
-          bodyLines.push(bl);
-        }
-
-        if (j < lines.length) {
-          // Found the matching closing fence: render the body (recursively, so
-          // nested callouts are handled) and emit the callout div.
-          const inner = await transform(bodyLines);
-          const renderedInner = await marked.parse(inner);
-          out.push(
-            `\n<div data-type="callout" data-callout-type="${type}">${renderedInner}</div>\n`,
-          );
-          i = j + 1; // skip past the closing `:::`
-          continue;
-        }
-        // No matching close (unterminated callout): treat the opener as a
-        // literal line and continue, preserving the original text.
-        out.push(line);
-        i++;
-        continue;
-      }
-
-      out.push(line);
-      i++;
-    }
-
-    return out.join("\n");
-  };
-
-  return transform(markdown.split("\n"));
-}
-
-/**
- * Bridge marked's checkbox lists to TipTap task lists.
+ * Footnote layering after #293 STEP 5:
+ *   - The package's `markdownToProseMirror` already ASSEMBLES footnotes on import
+ *     (canon #2): inline `^[body]` markers become the schema's
+ *     `footnoteReference` + a single doc-level `footnotesList`, with ids assigned
+ *     sequentially (`fn-1`, `fn-2`, …) in first-reference order and identical
+ *     bodies merged. So the import output is ALREADY in canonical footnote
+ *     topology.
+ *   - `canonicalizeFootnotes` runs AFTER as the mcp write-path invariant shared
+ *     with every other full-document persist path (`update_page_json`,
+ *     `docmost_transform`, `insert_footnote`, …). Because the package output is
+ *     already canonical, this layer is a no-op here (idempotent) — it exists so
+ *     the page-write contract is enforced uniformly regardless of how the PM doc
+ *     was produced, not because the import needs fixing.
  *
- * marked renders GitHub task list items (`- [x] done`) as a plain
- * `<ul><li><p><input type="checkbox" checked> text</p></li></ul>` WITHOUT the
- * markup TipTap's TaskList/TaskItem extensions parse. This rewrites such lists
- * into the shape those extensions expect:
- *   TaskList parseHTML matches `ul[data-type="taskList"]`,
- *   TaskItem matches `li[data-type="taskItem"]`,
- *   the checked state is read from `data-checked === "true"`.
- *
- * A list is only converted when it has at least one `<li>` and EVERY direct
- * `<li>` contains a checkbox input. Both `<ul>` and `<ol>` are considered: a
- * numbered checklist (`1. [x] a`, which marked renders as an `<ol>` of checkbox
- * `<li>`s) would otherwise lose its task state. TipTap task lists are unordered,
- * so a matching `<ol>` is emitted as `data-type="taskList"` exactly like a
- * `<ul>`. Mixed or ordinary lists (including ordinary `<ol>` lists) are left
- * untouched so they keep rendering as bullet/numbered lists. The marked `<p>`
- * wrapper is kept inside the `<li>` because TaskItem content allows paragraphs.
- */
-function bridgeTaskLists(html: string): string {
-  // Cheap early-out: if the markup contains no checkbox input at all there is
-  // nothing to bridge, so skip the expensive JSDOM parse entirely. This is the
-  // common case (most pages have no task lists).
-  if (!/type=["']?checkbox/i.test(html)) {
-    return html;
-  }
-  // Defensive cap (consistent with preprocessCallouts): skip the bridge for
-  // pathologically large inputs rather than running a second expensive JSDOM
-  // parse on a multi-megabyte payload. The markup is passed through verbatim.
-  if (html.length > MAX_CALLOUT_PREPROCESS_BYTES) {
-    return html;
-  }
-  const dom = new JSDOM(html);
-  const document = dom.window.document;
-  // Collect the checkbox(es) that belong to THIS <li> directly: either direct
-  // child <input type="checkbox"> elements or ones inside the <li>'s direct <p>
-  // child (the shape marked emits: `<li><p><input type="checkbox"> text</p></li>`).
-  // Checkboxes nested deeper (e.g. inside a child <ul>/<ol>) are excluded so a
-  // bullet <li> that merely contains a nested task sublist is not misdetected.
-  // Raw inline HTML can put more than one checkbox in a single <li>; we gather
-  // ALL of them so none survive into the converted item.
-  const directCheckboxes = (li: Element): Element[] => {
-    const found: Element[] = [];
-    for (const child of Array.from(li.children)) {
-      if (
-        child.tagName === "INPUT" &&
-        child.getAttribute("type") === "checkbox"
-      ) {
-        found.push(child);
-        continue;
-      }
-      if (child.tagName === "P") {
-        for (const inp of Array.from(
-          child.querySelectorAll(":scope > input[type='checkbox']"),
-        )) {
-          found.push(inp);
-        }
-      }
-    }
-    return found;
-  };
-  // Both <ul> and <ol> are candidates: an <ol> whose every direct <li> carries
-  // its own checkbox is a numbered checklist that must also become a taskList.
-  const lists = Array.from(document.querySelectorAll("ul, ol"));
-  for (const list of lists) {
-    // Only consider DIRECT child <li> elements; nested lists are handled by
-    // their own iteration of the outer loop.
-    const items = Array.from(list.children).filter(
-      (child) => child.tagName === "LI",
-    );
-    if (items.length === 0) continue;
-    const itemCheckboxes = items.map((li) => directCheckboxes(li));
-    // Convert only when every direct <li> carries at least one OWN checkbox.
-    if (!itemCheckboxes.every((boxes) => boxes.length > 0)) continue;
-
-    // A numbered checklist arrives as an <ol>. We must NOT leave the tag as
-    // <ol> while tagging it data-type="taskList": generateJSON would then match
-    // BOTH the orderedList rule (tag ol) and the taskList rule (data-type),
-    // emitting a phantom empty orderedList beside the real taskList. So rename a
-    // qualifying <ol> to a <ul> — move its <li> children over and replace it —
-    // leaving only the taskList rule to match. Already-<ul> lists are unchanged.
-    let target: Element = list;
-    if (list.tagName === "OL") {
-      const ul = document.createElement("ul");
-      // Carry over existing attributes (e.g. class) so nothing is silently lost.
-      for (const attr of Array.from(list.attributes)) {
-        ul.setAttribute(attr.name, attr.value);
-      }
-      // Move every child node (including the <li>s we collected) into the <ul>.
-      while (list.firstChild) {
-        ul.appendChild(list.firstChild);
-      }
-      list.replaceWith(ul);
-      target = ul;
-    }
-
-    target.setAttribute("data-type", "taskList");
-    items.forEach((li, index) => {
-      const boxes = itemCheckboxes[index];
-      // The first checkbox determines the checked state (matches the previous
-      // single-checkbox behaviour); any extras only need removing.
-      const input = boxes[0] ?? null;
-      li.setAttribute("data-type", "taskItem");
-      const checked =
-        input != null &&
-        (input.hasAttribute("checked") || (input as any).checked);
-      li.setAttribute("data-checked", checked ? "true" : "false");
-      // Remove ALL direct checkbox inputs so none survive into the content
-      // (a raw-inline-HTML <li> may carry more than one).
-      for (const box of boxes) {
-        box.remove();
-      }
-    });
-  }
-  return document.body.innerHTML;
-}
-
-// Mirror of packages/editor-ext footnote markdown handling. A `[^id]` inline
-// marker becomes <sup data-footnote-ref data-id="id">, and `[^id]: text`
-// definition lines are collected into a single <section data-footnotes>.
-// Definition detection + fence handling are shared with analyzeFootnotes via
-// lexFootnoteLines (footnote-lex.js). FOOTNOTE_REF_RE is the inline tokenizer's.
-const FOOTNOTE_REF_RE = /\[\^([^\]\s]+)\]/;
-
-function escapeFootnoteAttr(value: string): string {
-  return String(value).replace(/&/g, "&amp;").replace(/"/g, "&quot;");
-}
-
-const footnoteRefMarkedExtension = {
-  name: "footnoteRef",
-  level: "inline" as const,
-  start(src: string) {
-    return src.match(/\[\^/)?.index ?? -1;
-  },
-  tokenizer(src: string) {
-    const match = FOOTNOTE_REF_RE.exec(src);
-    if (match && match.index === 0) {
-      return { type: "footnoteRef", raw: match[0], id: match[1] };
-    }
-    return undefined;
-  },
-  renderer(token: any) {
-    return `<sup data-footnote-ref data-id="${escapeFootnoteAttr(
-      token.id,
-    )}"></sup>`;
-  },
-};
-
-marked.use({ extensions: [footnoteRefMarkedExtension] });
-
-/**
- * Pull `[^id]: text` definition lines out of the body and render a single
- * <section data-footnotes> for them (or "" when there are none).
- */
-function extractFootnotes(markdown: string): {
-  body: string;
-  section: string;
-} {
-  const bodyLines: string[] = [];
-  const defs: Array<{ id: string; text: string }> = [];
-  // Shared lexer (footnote-lex): a `[^id]: ...` line inside a ``` / ~~~ code
-  // block is inert and stays in the body verbatim; only real definition lines
-  // are pulled out. analyzeFootnotes() consumes the SAME lexer so its diagnostics
-  // match exactly what import keeps/strips (#166).
-  for (const tok of lexFootnoteLines(markdown)) {
-    if (!tok.inFence && tok.definition) defs.push(tok.definition);
-    else bodyLines.push(tok.line);
-  }
-  if (defs.length === 0) return { body: markdown, section: "" };
-
-  // Duplicate definition ids: FIRST WINS, the rest are DROPPED (mirror of
-  // editor-ext extractFootnoteDefinitions). Reference markers are left untouched
-  // so repeated `[^a]` references reuse the single footnote (Pandoc semantics,
-  // #166). The dropped duplicate is surfaced to the caller via analyzeFootnotes
-  // (`duplicateDefinitions`), not silently lost. MUST stay in sync with the
-  // editor-ext mirror.
-  const firstById = new Map<string, string>(); // id -> first definition text
-  for (const def of defs) {
-    if (!firstById.has(def.id)) firstById.set(def.id, def.text);
-  }
-
-  const inner = [...firstById.entries()]
-    .map(
-      ([id, text]) =>
-        `<div data-footnote-def data-id="${escapeFootnoteAttr(
-          id,
-        )}"><p>${marked.parseInline(text || "")}</p></div>`,
-    )
-    .join("");
-  return {
-    body: bodyLines.join("\n"),
-    section: `<section data-footnotes>${inner}</section>`,
-  };
-}
-
-/**
- * Convert markdown to a ProseMirror doc using the full Docmost schema.
- *
- * This conversion does NOT canonicalize footnotes — it is the shared, content-
- * preserving primitive used by BOTH page write paths and COMMENT bodies
- * (createComment / updateComment). Canonicalization MUST NOT run on a comment
- * body: a comment may legitimately contain a footnote-definition line
- * (`[^1]: text`) with no matching reference, and the canonicalizer drops a
- * reference-less footnotesList — which would silently delete the comment's text.
- *
- * Page write paths that DO need the canonical footnote topology call
- * `markdownToProseMirrorCanonical` instead (markdown import, update_page markdown
- * path). Keep this function reference-loss-free.
- */
-export async function markdownToProseMirror(
-  markdownContent: string,
-): Promise<any> {
-  const withCallouts = await preprocessCallouts(markdownContent);
-  const { body, section } = extractFootnotes(withCallouts);
-  const html = (await marked.parse(body)) + section;
-  const bridged = bridgeTaskLists(html);
-  return generateJSON(bridged, docmostExtensions);
-}
-
-/**
- * Page-write variant of `markdownToProseMirror`: converts markdown then enforces
- * the canonical footnote topology. The footnote `section` markdown is emitted in
- * DEFINITION order, but numbering derives from REFERENCE order, so without this
- * the bottom list renders out of order (`1, 4, 2, 3, …`); orphan definitions and
- * duplicate lists are also normalized. Idempotent — a no-op once canonical, and a
- * no-op for footnote-free content.
- *
- * Use this ONLY for full-document PAGE writes (never for comment bodies, where it
- * would drop a reference-less footnote definition — see `markdownToProseMirror`).
+ * Use this ONLY for full-document PAGE writes. Comment bodies call the package's
+ * plain `markdownToProseMirror` (no canonicalization) — safe now because inline
+ * `^[body]` footnotes carry their body at the reference point, so a comment can
+ * no longer produce a reference-less footnote definition to be dropped.
  */
 export async function markdownToProseMirrorCanonical(
   markdownContent: string,
diff --git a/packages/mcp/src/lib/docmost-schema.ts b/packages/mcp/src/lib/docmost-schema.ts
index 6478952b..200c4649 100644
--- a/packages/mcp/src/lib/docmost-schema.ts
+++ b/packages/mcp/src/lib/docmost-schema.ts
@@ -1,1273 +1,35 @@
 /**
- * Full TipTap extension set matching the real Docmost document schema.
+ * Docmost TipTap schema mirror.
  *
- * The default StarterKit-only schema silently destroys Docmost-specific
- * nodes (callout, table) and drops attributes it does not know about
- * (node ids, image sizing, link targets). Every code path that converts
- * to or from ProseMirror JSON must use THIS set, otherwise a round-trip
- * loses content.
- */
-import StarterKit from "@tiptap/starter-kit";
-import Image from "@tiptap/extension-image";
-import TaskList from "@tiptap/extension-task-list";
-import TaskItem from "@tiptap/extension-task-item";
-import Highlight from "@tiptap/extension-highlight";
-import Subscript from "@tiptap/extension-subscript";
-import Superscript from "@tiptap/extension-superscript";
-import { Node, Extension, Mark, getSchema } from "@tiptap/core";
-
-// Inlined from @tiptap/core's getStyleProperty (added after 3.20.x) so this
-// package can stay on the same @tiptap/core version as the editor and avoid a
-// duplicate-tiptap version split in the monorepo. Reads a single declaration
-// from an element's inline `style` attribute, last-wins, case-insensitive.
-function getStyleProperty(element: HTMLElement, propertyName: string): string | null {
-  const styleAttr = element.getAttribute("style");
-  if (!styleAttr) {
-    return null;
-  }
-  const decls = styleAttr.split(";").map((decl) => decl.trim()).filter(Boolean);
-  const target = propertyName.toLowerCase();
-  for (let i = decls.length - 1; i >= 0; i -= 1) {
-    const decl = decls[i];
-    const colonIndex = decl.indexOf(":");
-    if (colonIndex === -1) {
-      continue;
-    }
-    const prop = decl.slice(0, colonIndex).trim().toLowerCase();
-    if (prop === target) {
-      return decl.slice(colonIndex + 1).trim();
-    }
-  }
-  return null;
-}
-
-/** Allowed Docmost callout types; anything else falls back to "info". */
-const CALLOUT_TYPES = ["info", "warning", "danger", "success"];
-export const clampCalloutType = (value: string | null | undefined): string =>
-  value && CALLOUT_TYPES.includes(value.toLowerCase())
-    ? value.toLowerCase()
-    : "info";
-
-/**
- * Allowlist guard for CSS color values imported from HTML.
+ * #293 STEP 5: the extension set (and its parseHTML/renderHTML behaviour) is now
+ * owned by the shared `@docmost/prosemirror-markdown` package — the single
+ * canonical schema every converter path targets. MCP re-exports it here instead
+ * of maintaining its own drifted ~1200-line copy, so the schema can never drift
+ * between mcp and the package/git-sync again.
  *
- * Docmost interpolates stored mark colors straight into an inline style
- * attribute (e.g. style="background-color: ${color}" / "color: ${color}").
- * An unsanitized value such as `red; --x: url(...)` or `red"><script>` would
- * let a crafted document break out of the style attribute. We therefore only
- * accept a narrow, well-formed subset of CSS <color> syntax and reject (-> null)
- * anything else.
+ * `docmostExtensions` comes from the package; `docmostSchema` is derived from it
+ * exactly as before (`getSchema(docmostExtensions)`), built ONCE and reused by
+ * every consumer (diff, collaboration write-back) so the schema is identical at
+ * every call site.
  *
- * Accepted forms:
- *   - named colors:           letters only, e.g. "red", "rebeccapurple"
- *   - hex:                    #rgb, #rgba, #rrggbb, #rrggbbaa
- *   - functional notation:    rgb()/rgba()/hsl()/hsla() containing only
- *                             digits, %, ., commas, spaces and slashes
+ * The two schema sanitizers (`clampCalloutType`, `sanitizeCssColor`) are
+ * re-exported from the package's public barrel — they must NOT be re-defined
+ * here, or the mcp copy drifts from the package's (this had already happened:
+ * the local copy had lost the callout-type alias mapping the package applies).
+ * The single source of truth lives in the package (#326 invariant #2).
  */
-const SAFE_COLOR_RE =
-  /^(?:[a-zA-Z]+|#(?:[0-9a-fA-F]{3,4}|[0-9a-fA-F]{6}|[0-9a-fA-F]{8})|(?:rgb|rgba|hsl|hsla)\([0-9.,%/\s]+\))$/;
-export const sanitizeCssColor = (
-  value: string | null | undefined,
-): string | null => {
-  if (typeof value !== "string") return null;
-  const color = value.trim();
-  return color && SAFE_COLOR_RE.test(color) ? color : null;
-};
+import { getSchema } from "@tiptap/core";
+import {
+  docmostExtensions,
+  clampCalloutType,
+  sanitizeCssColor,
+} from "@docmost/prosemirror-markdown";
 
-/** Docmost callout (info/warning/danger/success banner). */
-const Callout = Node.create({
-  name: "callout",
-  group: "block",
-  content: "block+",
-  defining: true,
-  addAttributes() {
-    return {
-      // Read the type from data-callout-type so generateJSON(html) preserves
-      // it; without an explicit parseHTML every imported callout became "info".
-      type: {
-        default: "info",
-        parseHTML: (el: HTMLElement) =>
-          clampCalloutType(el.getAttribute("data-callout-type")),
-        renderHTML: (attrs: Record<string, any>) => ({
-          "data-callout-type": clampCalloutType(attrs.type),
-        }),
-      },
-      icon: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-icon"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.icon ? { "data-icon": attrs.icon } : {},
-      },
-    };
-  },
-  parseHTML() {
-    return [{ tag: 'div[data-type="callout"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-type": "callout", ...HTMLAttributes }, 0];
-  },
-});
-
-/** Minimal table family: enough for schema round-trips and HTML parsing. */
-const Table = Node.create({
-  name: "table",
-  group: "block",
-  content: "tableRow+",
-  isolating: true,
-  parseHTML() {
-    return [{ tag: "table" }];
-  },
-  renderHTML() {
-    return ["table", ["tbody", 0]];
-  },
-});
-
-const TableRow = Node.create({
-  name: "tableRow",
-  content: "(tableCell | tableHeader)*",
-  parseHTML() {
-    return [{ tag: "tr" }];
-  },
-  renderHTML() {
-    return ["tr", 0];
-  },
-});
-
-const cellAttributes = () => ({
-  colspan: { default: 1 },
-  rowspan: { default: 1 },
-  colwidth: { default: null },
-  backgroundColor: { default: null },
-  backgroundColorName: { default: null },
-  // Column alignment so GFM aligned tables (|:--|:-:|--:|) round-trip.
-  align: {
-    default: null,
-    parseHTML: (el: HTMLElement) =>
-      el.getAttribute("align") || el.style.textAlign || null,
-    renderHTML: (attrs: Record<string, any>) =>
-      attrs.align ? { align: attrs.align } : {},
-  },
-});
-
-const TableCell = Node.create({
-  name: "tableCell",
-  content: "block+",
-  isolating: true,
-  addAttributes: cellAttributes,
-  parseHTML() {
-    return [{ tag: "td" }];
-  },
-  renderHTML() {
-    return ["td", 0];
-  },
-});
-
-const TableHeader = Node.create({
-  name: "tableHeader",
-  content: "block+",
-  isolating: true,
-  addAttributes: cellAttributes,
-  parseHTML() {
-    return [{ tag: "th" }];
-  },
-  renderHTML() {
-    return ["th", 0];
-  },
-});
-
-/**
- * Attributes Docmost stores on standard nodes that the stock extensions
- * do not declare. Without these, Node.fromJSON silently drops them —
- * including the block ids that heading anchors rely on.
- */
-const DocmostAttributes = Extension.create({
-  name: "docmostAttributes",
-  addGlobalAttributes() {
-    return [
-      {
-        types: ["heading", "paragraph"],
-        attributes: {
-          id: { default: null },
-          indent: { default: null },
-          textAlign: { default: null },
-        },
-      },
-      {
-        types: ["image"],
-        attributes: {
-          align: { default: null },
-          attachmentId: { default: null },
-          aspectRatio: { default: null },
-          height: { default: null },
-          placeholder: { default: null },
-          size: { default: null },
-          width: { default: null },
-        },
-      },
-      {
-        types: ["orderedList"],
-        attributes: { type: { default: null } },
-      },
-      {
-        types: ["link"],
-        attributes: { internal: { default: null }, title: { default: null } },
-      },
-    ];
-  },
-});
-
-/**
- * Docmost inline comment mark. Anchors a comment thread to a text range via
- * `commentId`. Without it, any document containing comment highlights fails to
- * round-trip through the schema ("There is no mark type comment in this schema"),
- * which breaks update_page_json and edit_page_text on every commented page.
- * Mirrors Docmost's @docmost/editor-ext comment mark (commentId / resolved).
- */
-const Comment = Mark.create({
-  name: "comment",
-  exitable: true,
-  inclusive: false,
-  addAttributes() {
-    return {
-      commentId: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-comment-id"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.commentId ? { "data-comment-id": attrs.commentId } : {},
-      },
-      resolved: {
-        default: false,
-        parseHTML: (el: HTMLElement) =>
-          el.getAttribute("data-resolved") === "true",
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.resolved ? { "data-resolved": "true" } : {},
-      },
-    };
-  },
-  parseHTML() {
-    return [{ tag: "span[data-comment-id]" }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["span", { class: "comment-mark", ...HTMLAttributes }, 0];
-  },
-});
-
-/**
- * Text color mark. The markdown-converter emits colored text as
- * <span style="color: ...">, but with no mark parsing it back the color was
- * silently dropped on import. This mirrors TipTap's @tiptap/extension-text-style
- * `textStyle` mark (the name Docmost expects) and carries a single `color`
- * attribute. The parsed color is passed through the allowlist guard so a crafted
- * style cannot break out of the attribute when Docmost re-renders it.
- */
-const TextStyle = Mark.create({
-  name: "textStyle",
-  addAttributes() {
-    return {
-      color: {
-        default: null,
-        parseHTML: (el: HTMLElement) =>
-          sanitizeCssColor(
-            el.style.color || el.getAttribute("data-color"),
-          ),
-        renderHTML: (attrs: Record<string, any>) => {
-          const color = sanitizeCssColor(attrs.color);
-          return color ? { style: `color: ${color}` } : {};
-        },
-      },
-    };
-  },
-  parseHTML() {
-    return [
-      {
-        tag: "span",
-        // Only claim a plain colored span. Do NOT match spans that are already a
-        // comment mark (data-comment-id) or a mention node (data-type=mention),
-        // otherwise importing such HTML would silently drop the comment/mention.
-        getAttrs: (el: HTMLElement) =>
-          el.style.color &&
-          !el.getAttribute("data-comment-id") &&
-          el.getAttribute("data-type") !== "mention"
-            ? {}
-            : false,
-      },
-    ];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["span", HTMLAttributes, 0];
-  },
-});
-
-/**
- * Inline spoiler mark. Mirrors the @docmost/editor-ext `spoiler` mark so a
- * document carrying a spoiler survives the MCP read -> transform -> write path
- * (and markdown export) instead of silently dropping the unrecognized mark.
- * packages/mcp does NOT depend on editor-ext, so the definition is kept local;
- * it parses span[data-spoiler] and renders the same span[data-spoiler][class]
- * the editor-ext mark emits.
- */
-const Spoiler = Mark.create({
-  name: "spoiler",
-  // Don't bleed onto text typed at the boundary (mirrors editor-ext).
-  inclusive: false,
-  parseHTML() {
-    return [{ tag: "span[data-spoiler]" }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["span", { "data-spoiler": "true", class: "spoiler", ...HTMLAttributes }, 0];
-  },
-});
-
-/**
- * Passthrough definitions for the remaining Docmost-specific nodes.
- *
- * TiptapTransformer.toYdoc (the write path every mutation uses) throws
- * "Unknown node type: X" for any node not registered here, so editing ANY
- * page that contains one of these nodes used to fail outright. The read path
- * (fromYdoc) accepts them, which is why they appear in real documents.
- *
- * Each node below mirrors the real @docmost/editor-ext definition's name,
- * group, content, inline/atom flags and attribute keys (with the same data-*
- * HTML mapping) so that a fromYdoc -> transform -> toYdoc round-trip both
- * validates and preserves attributes faithfully. Interactive concerns
- * (node views, commands, keyboard shortcuts, input rules, suggestion plugins)
- * are intentionally omitted: the MCP server never renders these nodes, it only
- * needs the schema to accept and carry them. The Callout node above is the
- * pattern these follow.
- */
-
-/** Docmost @mention (user/page reference). Inline atom. */
-const Mention = Node.create({
-  name: "mention",
-  group: "inline",
-  inline: true,
-  selectable: true,
-  atom: true,
-  draggable: true,
-  addAttributes() {
-    return {
-      id: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-id"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.id ? { "data-id": attrs.id } : {},
-      },
-      label: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-label"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.label ? { "data-label": attrs.label } : {},
-      },
-      entityType: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-entity-type"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.entityType ? { "data-entity-type": attrs.entityType } : {},
-      },
-      entityId: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-entity-id"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.entityId ? { "data-entity-id": attrs.entityId } : {},
-      },
-      slugId: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-slug-id"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.slugId ? { "data-slug-id": attrs.slugId } : {},
-      },
-      creatorId: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-creator-id"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.creatorId ? { "data-creator-id": attrs.creatorId } : {},
-      },
-      anchorId: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-anchor-id"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.anchorId ? { "data-anchor-id": attrs.anchorId } : {},
-      },
-    };
-  },
-  parseHTML() {
-    return [{ tag: 'span[data-type="mention"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["span", { "data-type": "mention", ...HTMLAttributes }, 0];
-  },
-});
-
-/**
- * Footnote feature (mirror of packages/editor-ext/src/lib/footnote). Three
- * nodes connected by `id`:
- *  - FootnoteReference: inline atom marker in the body (<sup data-footnote-ref>);
- *  - FootnotesList:     a single bottom container (<section data-footnotes>);
- *  - FootnoteDefinition: one editable note keyed by id (<div data-footnote-def>).
- * The visible number is not stored; it is derived from reference order.
- *
- * priority 101 so this node's <sup> parse rule beats the Superscript mark's
- * <sup> rule (otherwise an empty reference is parsed as an empty superscript
- * mark and dropped). Keep in sync with editor-ext.
- */
-const FootnoteReference = Node.create({
-  name: "footnoteReference",
-  priority: 101,
-  group: "inline",
-  inline: true,
-  atom: true,
-  selectable: true,
-  draggable: false,
-  addAttributes() {
-    return {
-      id: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-id"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.id ? { "data-id": attrs.id } : {},
-      },
-    };
-  },
-  parseHTML() {
-    return [{ tag: "sup[data-footnote-ref]", priority: 100 }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["sup", { "data-footnote-ref": "", ...HTMLAttributes }];
-  },
-});
-
-const FootnotesList = Node.create({
-  name: "footnotesList",
-  group: "block",
-  content: "footnoteDefinition+",
-  isolating: true,
-  selectable: false,
-  defining: true,
-  parseHTML() {
-    return [{ tag: "section[data-footnotes]" }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["section", { "data-footnotes": "", ...HTMLAttributes }, 0];
-  },
-});
-
-const FootnoteDefinition = Node.create({
-  name: "footnoteDefinition",
-  content: "paragraph+",
-  defining: true,
-  isolating: true,
-  selectable: false,
-  addAttributes() {
-    return {
-      id: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-id"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.id ? { "data-id": attrs.id } : {},
-      },
-    };
-  },
-  parseHTML() {
-    return [{ tag: "div[data-footnote-def]" }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-footnote-def": "", ...HTMLAttributes }, 0];
-  },
-});
-
-/** Inline KaTeX expression. Carries the LaTeX source in `text`. */
-const MathInline = Node.create({
-  name: "mathInline",
-  group: "inline",
-  inline: true,
-  atom: true,
-  addAttributes() {
-    return {
-      text: { default: "" },
-    };
-  },
-  parseHTML() {
-    return [{ tag: 'span[data-type="mathInline"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return [
-      "span",
-      { "data-type": "mathInline", "data-katex": "true" },
-      `${HTMLAttributes.text ?? ""}`,
-    ];
-  },
-});
-
-/** Block KaTeX expression. Carries the LaTeX source in `text`. */
-const MathBlock = Node.create({
-  name: "mathBlock",
-  group: "block",
-  atom: true,
-  isolating: true,
-  addAttributes() {
-    return {
-      text: { default: "" },
-    };
-  },
-  parseHTML() {
-    return [{ tag: 'div[data-type="mathBlock"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return [
-      "div",
-      { "data-type": "mathBlock", "data-katex": "true" },
-      `${HTMLAttributes.text ?? ""}`,
-    ];
-  },
-});
-
-/** Collapsible <details> wrapper: summary + content children. */
-const Details = Node.create({
-  name: "details",
-  group: "block",
-  content: "detailsSummary detailsContent",
-  defining: true,
-  isolating: true,
-  addAttributes() {
-    return {
-      open: {
-        default: false,
-        parseHTML: (el: HTMLElement) => el.getAttribute("open"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.open ? { open: "" } : {},
-      },
-    };
-  },
-  parseHTML() {
-    return [{ tag: "details" }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["details", { ...HTMLAttributes }, 0];
-  },
-});
-
-/** Clickable summary line of a <details> block. */
-const DetailsSummary = Node.create({
-  name: "detailsSummary",
-  group: "block",
-  content: "inline*",
-  defining: true,
-  isolating: true,
-  selectable: false,
-  parseHTML() {
-    return [{ tag: "summary" }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["summary", { "data-type": "detailsSummary", ...HTMLAttributes }, 0];
-  },
-});
-
-/** Body of a <details> block. Permissive content so fromYdoc output validates. */
-const DetailsContent = Node.create({
-  name: "detailsContent",
-  group: "block",
-  // Docmost declares block* (an empty details body is valid); block+ would
-  // reject a collapsed/empty details on round-trip.
-  content: "block*",
-  defining: true,
-  selectable: false,
-  parseHTML() {
-    return [{ tag: 'div[data-type="detailsContent"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-type": "detailsContent", ...HTMLAttributes }, 0];
-  },
-});
-
-/** File attachment card (non-image upload). Block atom. */
-const Attachment = Node.create({
-  name: "attachment",
-  group: "block",
-  inline: false,
-  isolating: true,
-  atom: true,
-  defining: true,
-  draggable: true,
-  addAttributes() {
-    return {
-      url: {
-        default: "",
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-attachment-url"),
-        renderHTML: (attrs: Record<string, any>) => ({
-          "data-attachment-url": attrs.url ?? "",
-        }),
-      },
-      name: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-attachment-name"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.name ? { "data-attachment-name": attrs.name } : {},
-      },
-      mime: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-attachment-mime"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.mime ? { "data-attachment-mime": attrs.mime } : {},
-      },
-      size: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-attachment-size"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.size != null ? { "data-attachment-size": attrs.size } : {},
-      },
-      attachmentId: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-attachment-id"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.attachmentId
-            ? { "data-attachment-id": attrs.attachmentId }
-            : {},
-      },
-      // Docmost declares `placeholder` (a transient upload key, not rendered
-      // to HTML). Carry it so a round-trip never hits "Unsupported attribute".
-      placeholder: { default: null },
-    };
-  },
-  parseHTML() {
-    return [{ tag: 'div[data-type="attachment"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-type": "attachment", ...HTMLAttributes }, 0];
-  },
-});
-
-/** Uploaded <video> player. Block atom. */
-const Video = Node.create({
-  name: "video",
-  group: "block",
-  isolating: true,
-  atom: true,
-  defining: true,
-  draggable: true,
-  addAttributes() {
-    return {
-      src: {
-        default: "",
-        parseHTML: (el: HTMLElement) => el.getAttribute("src"),
-        renderHTML: (attrs: Record<string, any>) => ({ src: attrs.src ?? "" }),
-      },
-      alt: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("aria-label"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.alt ? { "aria-label": attrs.alt } : {},
-      },
-      attachmentId: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-attachment-id"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.attachmentId
-            ? { "data-attachment-id": attrs.attachmentId }
-            : {},
-      },
-      width: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("width"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.width != null ? { width: attrs.width } : {},
-      },
-      height: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("height"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.height != null ? { height: attrs.height } : {},
-      },
-      size: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-size"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.size != null ? { "data-size": attrs.size } : {},
-      },
-      align: {
-        default: "center",
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-align"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.align ? { "data-align": attrs.align } : {},
-      },
-      aspectRatio: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-aspect-ratio"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.aspectRatio != null
-            ? { "data-aspect-ratio": attrs.aspectRatio }
-            : {},
-      },
-      // Docmost declares `placeholder` (a transient upload key, not rendered
-      // to HTML). Carry it so a round-trip never hits "Unsupported attribute".
-      placeholder: { default: null },
-    };
-  },
-  parseHTML() {
-    return [{ tag: "video" }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["video", { controls: "true", ...HTMLAttributes }];
-  },
-});
-
-/**
- * Defensive passthrough for a `youtube` node. Docmost itself has no dedicated
- * youtube node (YouTube is handled via `embed`), but the converter read path
- * references this type, so accept it as a generic block atom that preserves
- * its src so legacy/external documents survive a round-trip.
- */
-const Youtube = Node.create({
-  name: "youtube",
-  group: "block",
-  inline: false,
-  isolating: true,
-  atom: true,
-  defining: true,
-  draggable: true,
-  addAttributes() {
-    return {
-      src: {
-        default: "",
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-src"),
-        renderHTML: (attrs: Record<string, any>) => ({
-          "data-src": attrs.src ?? "",
-        }),
-      },
-      width: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-width"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.width != null ? { "data-width": attrs.width } : {},
-      },
-      height: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-height"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.height != null ? { "data-height": attrs.height } : {},
-      },
-      align: {
-        default: "center",
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-align"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.align ? { "data-align": attrs.align } : {},
-      },
-    };
-  },
-  parseHTML() {
-    return [{ tag: 'div[data-type="youtube"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-type": "youtube", ...HTMLAttributes }, 0];
-  },
-});
-
-/** Generic embed (provider iframe). Block atom. */
-const Embed = Node.create({
-  name: "embed",
-  group: "block",
-  inline: false,
-  isolating: true,
-  atom: true,
-  defining: true,
-  draggable: true,
-  addAttributes() {
-    return {
-      src: {
-        default: "",
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-src"),
-        renderHTML: (attrs: Record<string, any>) => ({
-          "data-src": attrs.src ?? "",
-        }),
-      },
-      provider: {
-        default: "",
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-provider"),
-        renderHTML: (attrs: Record<string, any>) => ({
-          "data-provider": attrs.provider ?? "",
-        }),
-      },
-      align: {
-        default: "center",
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-align"),
-        renderHTML: (attrs: Record<string, any>) => ({
-          "data-align": attrs.align ?? "center",
-        }),
-      },
-      width: {
-        default: 800,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-width"),
-        renderHTML: (attrs: Record<string, any>) => ({
-          "data-width": attrs.width,
-        }),
-      },
-      height: {
-        default: 600,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-height"),
-        renderHTML: (attrs: Record<string, any>) => ({
-          "data-height": attrs.height,
-        }),
-      },
-    };
-  },
-  parseHTML() {
-    return [{ tag: 'div[data-type="embed"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-type": "embed", ...HTMLAttributes }, 0];
-  },
-});
-
-/**
- * Docmost raw HTML embed. Block atom; the client renders `source` inside a
- * sandboxed iframe. The MCP server never renders it — it only needs the
- * schema to accept and carry the node so a fromYdoc -> transform -> toYdoc
- * round-trip does not throw "Unknown node type: htmlEmbed". Mirrors the
- * @docmost/editor-ext node name, attribute keys and flags; keep in sync when
- * the editor-ext htmlEmbed schema changes.
- *
- * NOTE: unlike the canonical editor-ext node, `data-source` here is mapped as
- * plain text rather than base64-encoded. That is intentional: the MCP write
- * path carries the node through Yjs (fromYdoc -> toYdoc) on its JSON `source`
- * attribute and never invokes parseHTML/renderHTML, and htmlEmbed is not
- * produced from the markdown/HTML (generateJSON) path. If a future HTML path
- * for htmlEmbed is added here, this mapping must adopt editor-ext's base64
- * encode/decode to avoid double-encoding `source`.
- */
-const HtmlEmbed = Node.create({
-  name: "htmlEmbed",
-  group: "block",
-  inline: false,
-  isolating: true,
-  atom: true,
-  defining: true,
-  draggable: true,
-  addAttributes() {
-    return {
-      source: {
-        default: "",
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-source") ?? "",
-        renderHTML: (attrs: Record<string, any>) => ({
-          "data-source": attrs.source ?? "",
-        }),
-      },
-      height: {
-        default: null,
-        parseHTML: (el: HTMLElement) => {
-          const v = el.getAttribute("data-height");
-          if (!v) return null;
-          const n = parseInt(v, 10);
-          return Number.isFinite(n) ? n : null;
-        },
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.height != null ? { "data-height": String(attrs.height) } : {},
-      },
-    };
-  },
-  parseHTML() {
-    return [{ tag: 'div[data-type="htmlEmbed"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-type": "htmlEmbed", ...HTMLAttributes }, 0];
-  },
-});
-
-/** Shared attribute set for drawio/excalidraw diagram nodes. */
-const diagramAttributes = () => ({
-  src: {
-    default: "",
-    parseHTML: (el: HTMLElement) => el.getAttribute("data-src"),
-    renderHTML: (attrs: Record<string, any>) => ({
-      "data-src": attrs.src ?? "",
-    }),
-  },
-  title: {
-    default: null,
-    parseHTML: (el: HTMLElement) => el.getAttribute("data-title"),
-    renderHTML: (attrs: Record<string, any>) =>
-      attrs.title ? { "data-title": attrs.title } : {},
-  },
-  alt: {
-    default: null,
-    parseHTML: (el: HTMLElement) => el.getAttribute("data-alt"),
-    renderHTML: (attrs: Record<string, any>) =>
-      attrs.alt ? { "data-alt": attrs.alt } : {},
-  },
-  width: {
-    default: null,
-    parseHTML: (el: HTMLElement) => el.getAttribute("data-width"),
-    renderHTML: (attrs: Record<string, any>) =>
-      attrs.width != null ? { "data-width": attrs.width } : {},
-  },
-  height: {
-    default: null,
-    parseHTML: (el: HTMLElement) => el.getAttribute("data-height"),
-    renderHTML: (attrs: Record<string, any>) =>
-      attrs.height != null ? { "data-height": attrs.height } : {},
-  },
-  size: {
-    default: null,
-    parseHTML: (el: HTMLElement) => el.getAttribute("data-size"),
-    renderHTML: (attrs: Record<string, any>) =>
-      attrs.size != null ? { "data-size": attrs.size } : {},
-  },
-  aspectRatio: {
-    default: null,
-    parseHTML: (el: HTMLElement) => el.getAttribute("data-aspect-ratio"),
-    renderHTML: (attrs: Record<string, any>) =>
-      attrs.aspectRatio != null
-        ? { "data-aspect-ratio": attrs.aspectRatio }
-        : {},
-  },
-  align: {
-    default: "center",
-    parseHTML: (el: HTMLElement) => el.getAttribute("data-align"),
-    renderHTML: (attrs: Record<string, any>) =>
-      attrs.align ? { "data-align": attrs.align } : {},
-  },
-  attachmentId: {
-    default: null,
-    parseHTML: (el: HTMLElement) => el.getAttribute("data-attachment-id"),
-    renderHTML: (attrs: Record<string, any>) =>
-      attrs.attachmentId ? { "data-attachment-id": attrs.attachmentId } : {},
-  },
-});
-
-/** draw.io diagram. Block atom (image-backed). */
-const Drawio = Node.create({
-  name: "drawio",
-  group: "block",
-  inline: false,
-  isolating: true,
-  atom: true,
-  defining: true,
-  draggable: true,
-  addAttributes: diagramAttributes,
-  parseHTML() {
-    return [{ tag: 'div[data-type="drawio"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-type": "drawio", ...HTMLAttributes }, 0];
-  },
-});
-
-/** Excalidraw diagram. Block atom (image-backed). */
-const Excalidraw = Node.create({
-  name: "excalidraw",
-  group: "block",
-  inline: false,
-  isolating: true,
-  atom: true,
-  defining: true,
-  draggable: true,
-  addAttributes: diagramAttributes,
-  parseHTML() {
-    return [{ tag: 'div[data-type="excalidraw"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-type": "excalidraw", ...HTMLAttributes }, 0];
-  },
-});
-
-/** Multi-column layout container holding one or more `column` children. */
-const Columns = Node.create({
-  name: "columns",
-  group: "block",
-  content: "column+",
-  defining: true,
-  isolating: true,
-  addAttributes() {
-    return {
-      layout: {
-        default: "two_equal",
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-layout"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.layout ? { "data-layout": attrs.layout } : {},
-      },
-      widthMode: {
-        default: "normal",
-        parseHTML: (el: HTMLElement) =>
-          el.getAttribute("data-width-mode") || "normal",
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.widthMode && attrs.widthMode !== "normal"
-            ? { "data-width-mode": attrs.widthMode }
-            : {},
-      },
-    };
-  },
-  parseHTML() {
-    return [{ tag: 'div[data-type="columns"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-type": "columns", ...HTMLAttributes }, 0];
-  },
-});
-
-/** Single column within a `columns` layout. */
-const Column = Node.create({
-  name: "column",
-  group: "block",
-  content: "block+",
-  defining: true,
-  isolating: true,
-  selectable: false,
-  addAttributes() {
-    return {
-      width: {
-        default: null,
-        parseHTML: (el: HTMLElement) => {
-          const value = el.getAttribute("data-width");
-          return value ? parseFloat(value) : null;
-        },
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.width ? { "data-width": attrs.width } : {},
-      },
-    };
-  },
-  parseHTML() {
-    return [{ tag: 'div[data-type="column"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-type": "column", ...HTMLAttributes }, 0];
-  },
-});
-
-/**
- * Subpages listing block (auto-generated index of child pages). Docmost
- * declares no attributes; the markdown-converter has a `case "subpages"`, so
- * the read path can emit it and toYdoc must accept it. Block atom.
- */
-const Subpages = Node.create({
-  name: "subpages",
-  group: "block",
-  inline: false,
-  isolating: true,
-  atom: true,
-  defining: true,
-  draggable: true,
-  parseHTML() {
-    return [{ tag: 'div[data-type="subpages"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-type": "subpages", ...HTMLAttributes }, 0];
-  },
-});
-
-/** Uploaded <audio> player. Block atom. Mirrors Docmost audio attrs. */
-const Audio = Node.create({
-  name: "audio",
-  group: "block",
-  inline: false,
-  isolating: true,
-  atom: true,
-  defining: true,
-  draggable: true,
-  addAttributes() {
-    return {
-      src: {
-        default: "",
-        parseHTML: (el: HTMLElement) => el.getAttribute("src"),
-        renderHTML: (attrs: Record<string, any>) => ({ src: attrs.src ?? "" }),
-      },
-      attachmentId: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-attachment-id"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.attachmentId
-            ? { "data-attachment-id": attrs.attachmentId }
-            : {},
-      },
-      size: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-size"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.size != null ? { "data-size": attrs.size } : {},
-      },
-      // Transient upload key Docmost declares with rendered:false; carried so
-      // a round-trip never hits "Unsupported attribute".
-      placeholder: { default: null },
-    };
-  },
-  parseHTML() {
-    return [{ tag: "audio" }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["audio", { controls: "true", ...HTMLAttributes }];
-  },
-});
-
-/** Embedded PDF viewer. Block atom. Mirrors Docmost pdf attrs. */
-const Pdf = Node.create({
-  name: "pdf",
-  group: "block",
-  inline: false,
-  isolating: true,
-  atom: true,
-  defining: true,
-  draggable: true,
-  addAttributes() {
-    return {
-      src: {
-        default: "",
-        parseHTML: (el: HTMLElement) => el.getAttribute("src"),
-        renderHTML: (attrs: Record<string, any>) => ({ src: attrs.src ?? "" }),
-      },
-      name: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-name"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.name ? { "data-name": attrs.name } : {},
-      },
-      attachmentId: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-attachment-id"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.attachmentId
-            ? { "data-attachment-id": attrs.attachmentId }
-            : {},
-      },
-      size: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("data-size"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.size != null ? { "data-size": attrs.size } : {},
-      },
-      width: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("width"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.width != null ? { width: attrs.width } : {},
-      },
-      height: {
-        default: null,
-        parseHTML: (el: HTMLElement) => el.getAttribute("height"),
-        renderHTML: (attrs: Record<string, any>) =>
-          attrs.height != null ? { height: attrs.height } : {},
-      },
-      // Transient upload key Docmost declares with rendered:false; carried so
-      // a round-trip never hits "Unsupported attribute".
-      placeholder: { default: null },
-    };
-  },
-  parseHTML() {
-    return [{ tag: 'div[data-type="pdf"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-type": "pdf", ...HTMLAttributes }, 0];
-  },
-});
-
-/** Page break (print/export divider). Block atom; Docmost declares no attrs. */
-const PageBreak = Node.create({
-  name: "pageBreak",
-  group: "block",
-  inline: false,
-  isolating: true,
-  atom: true,
-  defining: true,
-  draggable: true,
-  parseHTML() {
-    return [{ tag: 'div[data-type="pageBreak"]' }];
-  },
-  renderHTML({ HTMLAttributes }) {
-    return ["div", { "data-type": "pageBreak", ...HTMLAttributes }];
-  },
-});
-
-/**
- * Full extension list. Image is block-level (matches Docmost); the
- * ProseMirror DOM parser hoists <img> found inside <p> automatically.
- * StarterKit v3 already bundles the link extension, configured here.
- */
-export const docmostExtensions = [
-  StarterKit.configure({
-    codeBlock: {},
-    heading: {},
-    link: { openOnClick: false },
-  }),
-  // Stock @tiptap/extension-image has no caption attribute, so a round-trip
-  // through this schema would drop the data-caption the client TiptapImage
-  // emits. Mirror editor-ext image.ts: add a caption attribute that parses
-  // data-caption and re-renders it only when set (caption-less images stay
-  // clean), keeping the MCP markdown round-trip lossless.
-  Image.extend({
-    addAttributes() {
-      const parent = this.parent?.() ?? {};
-      return {
-        ...parent,
-        caption: {
-          default: undefined,
-          parseHTML: (el: HTMLElement) =>
-            el.getAttribute("data-caption") || undefined,
-          renderHTML: (attrs: Record<string, any>) =>
-            attrs.caption ? { "data-caption": attrs.caption } : {},
-        },
-      };
-    },
-  }).configure({ inline: false }),
-  TaskList,
-  TaskItem.configure({ nested: true }),
-  // Highlight stores its color unescaped and Docmost interpolates it into
-  // style="background-color: ${color}". Wrap the color attribute's parseHTML
-  // with the same allowlist guard used by textStyle so a crafted import color
-  // cannot break out of the style attribute. Multicolor behavior is preserved.
-  Highlight.extend({
-    addAttributes() {
-      const parent = this.parent?.() ?? {};
-      return {
-        ...parent,
-        color: {
-          ...(parent as Record<string, any>).color,
-          parseHTML: (el: HTMLElement) =>
-            sanitizeCssColor(
-              el.getAttribute("data-color") ||
-                getStyleProperty(el, "background-color") ||
-                el.style.backgroundColor,
-            ),
-        },
-      };
-    },
-  }).configure({ multicolor: true }),
-  Subscript,
-  Superscript,
-  // StarterKit does not provide a textStyle mark, so register ours; without it
-  // generateJSON drops <span style="color: ...">, defeating the color import.
-  TextStyle,
-  Comment,
-  Spoiler,
-  Callout,
-  Table,
-  TableRow,
-  TableCell,
-  TableHeader,
-  Mention,
-  FootnoteReference,
-  FootnotesList,
-  FootnoteDefinition,
-  MathInline,
-  MathBlock,
-  Details,
-  DetailsSummary,
-  DetailsContent,
-  Attachment,
-  Video,
-  Youtube,
-  Embed,
-  HtmlEmbed,
-  Drawio,
-  Excalidraw,
-  Columns,
-  Column,
-  Subpages,
-  Audio,
-  Pdf,
-  PageBreak,
-  DocmostAttributes,
-];
+export { docmostExtensions, clampCalloutType, sanitizeCssColor };
 
 /**
  * The ProseMirror schema for the docmost editor, built ONCE from
  * `docmostExtensions`. Pure and reused by every consumer (diff, collaboration
- * write-back) so the schema can never drift between call sites — it lives next
- * to the extension list it is derived from.
+ * write-back) so the schema can never drift between call sites.
  */
 export const docmostSchema = getSchema(docmostExtensions);
diff --git a/packages/mcp/src/lib/footnote-analyze.ts b/packages/mcp/src/lib/footnote-analyze.ts
index b259ea00..11178d25 100644
--- a/packages/mcp/src/lib/footnote-analyze.ts
+++ b/packages/mcp/src/lib/footnote-analyze.ts
@@ -1,5 +1,5 @@
 /**
- * Footnote diagnostics for imported Markdown (issue #166).
+ * Legacy footnote diagnostics for imported Markdown (issue #166).
  *
  * A PURE, fence-aware text scan (independent of the Markdown->ProseMirror
  * conversion path, so it reports the same problems for `create_page`,
@@ -7,11 +7,18 @@
  * importer still creates the page; this only surfaces footnote problems to the
  * caller so an agent can fix its own markup instead of shipping broken footnotes.
  *
+ * SCOPE after #293 STEP 5: the canonical import form is now inline `^[body]`
+ * footnotes (handled by `@docmost/prosemirror-markdown`), where these problems
+ * cannot arise. This scan therefore targets the LEGACY reference-style
+ * (`[^id]` / `[^id]:`) markup, which is now inert on import (left as literal
+ * text). The warnings remain useful as an advisory nudge when an agent still
+ * authors the old syntax, but they no longer describe what the importer builds.
+ *
  * Detected problems:
  *  - danglingReferences: a `[^id]` reference with no `[^id]:` definition.
  *  - emptyDefinitions:   a `[^id]:` whose (kept) text is empty/whitespace.
  *  - duplicateDefinitions: an id defined by two or more `[^id]:` lines (only the
- *    first is kept on import — first-wins; see extractFootnotes).
+ *    first would have been kept under the old first-wins import).
  *  - referencesInTables: a `[^id]` marker found in a GFM table row (heuristic:
  *    the line, trimmed, starts with `|`) — footnotes in table cells often do not
  *    render as expected.
diff --git a/packages/mcp/src/lib/footnote-lex.ts b/packages/mcp/src/lib/footnote-lex.ts
index 30da676b..4a684e86 100644
--- a/packages/mcp/src/lib/footnote-lex.ts
+++ b/packages/mcp/src/lib/footnote-lex.ts
@@ -1,12 +1,14 @@
 /**
- * Shared, fence-aware line lexer for footnote markdown (MCP-internal).
+ * Shared, fence-aware line lexer for legacy footnote markdown (MCP-internal).
  *
- * Both the importer (`extractFootnotes` in collaboration.ts, which strips
- * definition lines and rebuilds a footnotes section) and the diagnostics
- * (`analyzeFootnotes` in footnote-analyze.ts) must agree EXACTLY on which lines
- * are definitions and which lines are inert (inside a code fence). Sharing one
- * lexer makes "the analyzer sees what the importer leaves" a structural property
- * instead of two hand-kept copies that can drift (#166 review).
+ * Since #293 STEP 5 the markdown -> ProseMirror IMPORT path lives in the shared
+ * `@docmost/prosemirror-markdown` package (inline `^[body]` footnotes), so this
+ * lexer no longer backs an mcp importer. It now backs ONLY the import-time
+ * diagnostics (`analyzeFootnotes` in footnote-analyze.ts), which still scan the
+ * raw markdown for legacy reference-style `[^id]:` definition lines and surface
+ * advisory warnings (duplicate/orphan definitions) about content that is now
+ * inert on import. Fence-awareness (a `[^id]:` line inside a ``` / ~~~ block is
+ * NOT a definition) is the property the analyzer relies on.
  *
  * NOTE: this is deliberately NOT shared with editor-ext's
  * `extractFootnoteDefinitions` — that lives in a different package and the
diff --git a/packages/mcp/src/lib/markdown-converter.ts b/packages/mcp/src/lib/markdown-converter.ts
index f9758ace..b39f608b 100644
--- a/packages/mcp/src/lib/markdown-converter.ts
+++ b/packages/mcp/src/lib/markdown-converter.ts
@@ -1,903 +1,15 @@
 /**
- * Convert ProseMirror/TipTap JSON content to Markdown
- * Supports all Docmost-specific node types and extensions
+ * ProseMirror -> Docmost-flavoured Markdown converter.
+ *
+ * #293 STEP 5: the converter CORE now lives in the shared
+ * `@docmost/prosemirror-markdown` package (the canonical, lossless
+ * implementation carrying every git-sync fix and the #293 canon decisions).
+ * MCP consumes it directly instead of keeping its own drifted copy, so the two
+ * can never diverge again. This file is a thin re-export shim kept only so the
+ * many existing `./markdown-converter.js` importers (client.ts, tests) do not
+ * have to move.
  */
-export function convertProseMirrorToMarkdown(content: any): string {
-  if (!content || !content.content) return "";
-
-  // Escape a value interpolated into an HTML double-quoted attribute value
-  // (textAlign, colors, image src, math `text`, all data-* attrs, etc.). In the
-  // ATTRIBUTE context only the quote that delimits the value and the ampersand
-  // that starts an entity are special, so we escape ONLY & " (and ' for safety
-  // when single-quoted delimiters are used). We deliberately do NOT escape < or
-  // >: the HTML re-parser (parse5/jsdom via @tiptap/html) does NOT decode
-  // &lt;/&gt; back inside attribute values, so escaping them would corrupt the
-  // stored data (e.g. a math node's LaTeX `a < b`) and ACCUMULATE escapes on
-  // every round-trip (`a < b` -> `a &lt; b` -> `a &amp;lt; b`). Escaping & "
-  // keeps the value inert against attribute-injection while staying idempotent.
-  // NOTE: escape ONLY & and " here. The value is always wrapped in double
-  // quotes, so " is the only delimiter; ' is NOT special in a double-quoted
-  // value, and parse5 does not decode &#39; back inside attribute values, so
-  // escaping ' would (like < >) corrupt the value and accumulate &amp; on every
-  // round-trip. Escaping & and " is idempotent (parse5 decodes them back).
-  const escapeAttr = (value: unknown): string =>
-    String(value)
-      .replace(/&/g, "&amp;")
-      .replace(/"/g, "&quot;");
-
-  // Escape a value placed as HTML element TEXT content (between tags), where
-  // <, >, and & are all significant. Used for text rendered inside raw-HTML
-  // blocks (table cells / columns) so stored characters cannot inject markup.
-  const escapeHtmlText = (value: unknown): string =>
-    String(value)
-      .replace(/&/g, "&amp;")
-      .replace(/</g, "&lt;")
-      .replace(/>/g, "&gt;");
-
-  // Percent-encode characters that would break out of a markdown URL target
-  // (...) — whitespace/newlines and parentheses — so a stored src stays a
-  // single inert token (used for image/video/youtube srcs).
-  const encodeMdUrl = (value: unknown): string =>
-    String(value || "")
-      .replace(/\s/g, (c: string) => (c === " " ? "%20" : encodeURIComponent(c)))
-      .replace(/\(/g, "%28")
-      .replace(/\)/g, "%29");
-
-  const processNode = (node: any): string => {
-    const type = node.type;
-    const nodeContent = node.content || [];
-
-    switch (type) {
-      case "doc":
-        return nodeContent.map(processNode).join("\n\n");
-
-      case "paragraph":
-        const text = nodeContent.map(processNode).join("");
-        const align = node.attrs?.textAlign;
-        if (align && align !== "left") {
-          return `<div align="${escapeAttr(align)}">${text}</div>`;
-        }
-        return text || "";
-
-      case "heading":
-        const level = node.attrs?.level || 1;
-        const headingText = nodeContent.map(processNode).join("");
-        return "#".repeat(level) + " " + headingText;
-
-      case "text":
-        let textContent = node.text || "";
-        // Apply marks (bold, italic, code, etc.)
-        if (node.marks) {
-          // Markdown code spans (`...`) cannot carry inner formatting, so when a
-          // run has the `code` mark alongside ANY other mark, backtick syntax
-          // would leak literal ** / []() into the code text. In that case emit
-          // nested HTML (<code> innermost, the other marks wrapping it as HTML)
-          // so the output is at least well-formed and re-parseable.
-          //
-          // NOTE: this does NOT round-trip both marks. The schema's `code` mark
-          // has `excludes: "_"` (it excludes every other mark), so on import the
-          // co-occurring mark is always dropped — the run comes back as `code`
-          // only. We keep the emission simple and accept that the other mark is
-          // lost; preserving both is impossible while `code` excludes them.
-          // Only use the backtick form when `code` is the sole mark.
-          const markTypes = node.marks.map((m: any) => m.type);
-          const hasCode = markTypes.includes("code");
-          const codeCombined = hasCode && markTypes.length > 1;
-          for (const mark of node.marks) {
-            switch (mark.type) {
-              case "bold":
-                textContent = codeCombined
-                  ? `<strong>${textContent}</strong>`
-                  : `**${textContent}**`;
-                break;
-              case "italic":
-                textContent = codeCombined
-                  ? `<em>${textContent}</em>`
-                  : `*${textContent}*`;
-                break;
-              case "code":
-                // When combined with another mark, wrap as <code> so the
-                // surrounding HTML marks can nest around it; otherwise use the
-                // plain backtick span.
-                textContent = codeCombined
-                  ? `<code>${textContent}</code>`
-                  : `\`${textContent}\``;
-                break;
-              case "link": {
-                const href = mark.attrs?.href || "";
-                const title = mark.attrs?.title;
-                if (codeCombined) {
-                  // Emit an HTML anchor so it can wrap the nested <code>.
-                  const safeHref = escapeAttr(href);
-                  if (title) {
-                    textContent = `<a href="${safeHref}" title="${escapeAttr(String(title))}">${textContent}</a>`;
-                  } else {
-                    textContent = `<a href="${safeHref}">${textContent}</a>`;
-                  }
-                } else if (title) {
-                  // Emit the optional markdown link title; escape an embedded
-                  // double-quote so it cannot terminate the title string early.
-                  const safeTitle = String(title).replace(/"/g, '\\"');
-                  textContent = `[${textContent}](${href} "${safeTitle}")`;
-                } else {
-                  textContent = `[${textContent}](${href})`;
-                }
-                break;
-              }
-              case "strike":
-                textContent = codeCombined
-                  ? `<s>${textContent}</s>`
-                  : `~~${textContent}~~`;
-                break;
-              case "underline":
-                textContent = `<u>${textContent}</u>`;
-                break;
-              case "subscript":
-                textContent = `<sub>${textContent}</sub>`;
-                break;
-              case "superscript":
-                textContent = `<sup>${textContent}</sup>`;
-                break;
-              case "highlight": {
-                // Preserve a null/empty color as a plain highlight (a bare
-                // <mark> with no background-color); only emit the style when a
-                // color is actually set, so a plain highlight is not forced to
-                // yellow on export.
-                const color = mark.attrs?.color;
-                textContent = color
-                  ? `<mark style="background-color: ${escapeAttr(color)}">${textContent}</mark>`
-                  : `<mark>${textContent}</mark>`;
-                break;
-              }
-              case "textStyle":
-                if (mark.attrs?.color) {
-                  textContent = `<span style="color: ${escapeAttr(mark.attrs.color)}">${textContent}</span>`;
-                }
-                break;
-              case "comment": {
-                // Emit the inline comment anchor so highlights round-trip. The
-                // schema's Comment mark parses span[data-comment-id] (attrs
-                // commentId/resolved).
-                const cid = mark.attrs?.commentId;
-                if (cid) {
-                  const resolvedAttr = mark.attrs?.resolved
-                    ? ` data-resolved="true"`
-                    : "";
-                  textContent = `<span data-comment-id="${escapeAttr(cid)}"${resolvedAttr}>${textContent}</span>`;
-                }
-                break;
-              }
-              case "spoiler":
-                // Markdown has no native spoiler syntax, so emit the same
-                // lossless raw HTML the editor-ext turndown rule produces; the
-                // schema's Spoiler mark parses span[data-spoiler] back on import.
-                textContent = `<span data-spoiler="true">${textContent}</span>`;
-                break;
-            }
-          }
-        }
-        return textContent;
-
-      case "codeBlock":
-        const language = node.attrs?.language || "";
-        // Strip ALL trailing newlines so the export is idempotent: marked
-        // re-adds exactly one trailing "\n" on import, so trimming only one
-        // here would let the text grow by "\n" on each round-trip. Removing
-        // every trailing newline makes repeated cycles stable.
-        const code = nodeContent
-          .map(processNode)
-          .join("")
-          .replace(/\n+$/, "");
-        return "```" + language + "\n" + code + "\n```";
-
-      case "bulletList":
-        return nodeContent
-          .map((item: any) => processListItem(item, "-"))
-          .join("\n");
-
-      case "orderedList":
-        return nodeContent
-          .map((item: any, index: number) =>
-            processListItem(item, `${index + 1}.`),
-          )
-          .join("\n");
-
-      case "taskList":
-        return nodeContent.map((item: any) => processTaskItem(item)).join("\n");
-
-      case "taskItem":
-        // Delegate to the same helper used by taskList so multi-block and
-        // nested task items render and indent consistently.
-        return processTaskItem(node);
-
-      case "listItem":
-        return nodeContent.map(processNode).join("\n");
-
-      case "blockquote":
-        // Prefix EVERY line of EVERY child with "> " and separate block-level
-        // children with a blank ">" line so code blocks / multi-paragraph
-        // quotes round-trip correctly.
-        return nodeContent
-          .map((n: any) =>
-            processNode(n)
-              .split("\n")
-              .map((line: string) => (line.length ? `> ${line}` : ">"))
-              .join("\n"),
-          )
-          .join("\n>\n");
-
-      case "horizontalRule":
-        return "---";
-
-      case "hardBreak":
-        // Two trailing spaces before the newline encode a markdown hard break;
-        // a bare "\n" would be reimported as a soft break and lost.
-        return "  \n";
-
-      case "image": {
-        const imgAlt = node.attrs?.alt || "";
-        const imgCaption = node.attrs?.caption || "";
-        if (imgCaption) {
-          // ![]() can't carry a caption, so (symmetric to video) emit a raw
-          // <img> wrapped in a block <div>. On import marked.parse keeps the raw
-          // HTML and generateJSON runs the image extension's parseHTML, which
-          // restores the caption from data-caption.
-          const parts: string[] = [`src="${escapeAttr(node.attrs?.src ?? "")}"`];
-          if (imgAlt) parts.push(`alt="${escapeAttr(imgAlt)}"`);
-          parts.push(`data-caption="${escapeAttr(imgCaption)}"`);
-          return `<div><img ${parts.join(" ")}></div>`;
-        }
-        // Neutralize characters that could break out of the markdown image
-        // URL: spaces/newlines and parentheses would terminate the (...) target
-        // and let a stored src inject following markdown/HTML. Percent-encode
-        // them so the URL stays a single inert token.
-        const imgSrc = encodeMdUrl(node.attrs?.src);
-        return `![${imgAlt}](${imgSrc})`;
-      }
-
-      case "video": {
-        // Emit the schema-matching <video> element so generateJSON rebuilds the
-        // node with its attrs intact. The schema's parseHTML reads src/aria-label
-        // from the standard attributes and the remaining attrs from data-*.
-        const attrs = node.attrs || {};
-        const parts: string[] = [`src="${escapeAttr(attrs.src ?? "")}"`];
-        if (attrs.alt) parts.push(`aria-label="${escapeAttr(attrs.alt)}"`);
-        if (attrs.attachmentId)
-          parts.push(
-            `data-attachment-id="${escapeAttr(attrs.attachmentId)}"`,
-          );
-        if (attrs.width != null)
-          parts.push(`width="${escapeAttr(attrs.width)}"`);
-        if (attrs.height != null)
-          parts.push(`height="${escapeAttr(attrs.height)}"`);
-        if (attrs.size != null)
-          parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-        if (attrs.align)
-          parts.push(`data-align="${escapeAttr(attrs.align)}"`);
-        if (attrs.aspectRatio != null)
-          parts.push(`data-aspect-ratio="${escapeAttr(attrs.aspectRatio)}"`);
-        // Wrap in a block <div> so marked treats it as a block (a bare <video>
-        // is inline-level HTML and marked wraps it in <p>, leaving a spurious
-        // empty paragraph beside the hoisted block atom). The wrapper has no
-        // data-type, so the schema parser ignores it and just hoists the video.
-        return `<div><video ${parts.join(" ")}></video></div>`;
-      }
-
-      case "youtube": {
-        // Emit the schema-matching div[data-type="youtube"]; the schema reads
-        // src from data-src and width/height/align from data-* attributes.
-        const attrs = node.attrs || {};
-        const parts: string[] = [
-          `data-type="youtube"`,
-          `data-src="${escapeAttr(attrs.src ?? "")}"`,
-        ];
-        if (attrs.width != null)
-          parts.push(`data-width="${escapeAttr(attrs.width)}"`);
-        if (attrs.height != null)
-          parts.push(`data-height="${escapeAttr(attrs.height)}"`);
-        if (attrs.align)
-          parts.push(`data-align="${escapeAttr(attrs.align)}"`);
-        return `<div ${parts.join(" ")}></div>`;
-      }
-
-      case "table": {
-        // A GFM pipe table cannot represent merged cells. If ANY cell carries
-        // colspan>1 or rowspan>1, a pipe table would corrupt the grid on
-        // re-import, so emit the WHOLE table as raw HTML <table> instead: the
-        // schema's table family parseHTML (tag table/tr/td/th, with colspan/
-        // rowspan read from the same-named HTML attrs and align via parseHTML)
-        // round-trips it faithfully. Otherwise keep the lighter GFM pipe table.
-        const tableRows: any[] = nodeContent;
-        if (tableRows.length === 0) return "";
-        const hasSpan = tableRows.some((row: any) =>
-          (row.content || []).some(
-            (cell: any) =>
-              (cell.attrs?.colspan ?? 1) > 1 || (cell.attrs?.rowspan ?? 1) > 1,
-          ),
-        );
-
-        if (hasSpan) {
-          // Render each cell's block children to HTML (marked does NOT parse
-          // markdown inside a raw HTML block, so emitting markdown here would
-          // leak literal ** / `` into the cell). blockToHtml mirrors the schema
-          // HTML so inner formatting re-parses into the right marks/nodes.
-          const renderHtmlCell = (cell: any): string => {
-            const tag = cell.type === "tableHeader" ? "th" : "td";
-            const a = cell.attrs || {};
-            const cellParts: string[] = [];
-            if ((a.colspan ?? 1) > 1)
-              cellParts.push(`colspan="${escapeAttr(a.colspan)}"`);
-            if ((a.rowspan ?? 1) > 1)
-              cellParts.push(`rowspan="${escapeAttr(a.rowspan)}"`);
-            if (a.align) cellParts.push(`align="${escapeAttr(a.align)}"`);
-            const open = cellParts.length
-              ? `<${tag} ${cellParts.join(" ")}>`
-              : `<${tag}>`;
-            const inner = (cell.content || [])
-              .map((block: any) => blockToHtml(block))
-              .join("");
-            return `${open}${inner}</${tag}>`;
-          };
-          const htmlRows = tableRows
-            .map(
-              (row: any) =>
-                `<tr>${(row.content || []).map(renderHtmlCell).join("")}</tr>`,
-            )
-            .join("");
-          return `<table><tbody>${htmlRows}</tbody></table>`;
-        }
-
-        // No merged cells: emit a GFM table (header row + separator) so the
-        // markdown can be parsed back into a table on re-import.
-        const rows = tableRows.map(processNode);
-        const headerCells = tableRows[0]?.content || [];
-        const columns = headerCells.length || 1;
-        // Derive alignment markers (:--, :-:, --:) from each header cell.
-        const markers = Array.from({ length: columns }, (_, i) => {
-          const align = headerCells[i]?.attrs?.align;
-          switch (align) {
-            case "left":
-              return ":--";
-            case "center":
-              return ":-:";
-            case "right":
-              return "--:";
-            default:
-              return "---";
-          }
-        });
-        const separator = "| " + markers.join(" | ") + " |";
-        return [rows[0], separator, ...rows.slice(1)].join("\n");
-      }
-
-      case "tableRow":
-        return "| " + nodeContent.map(processNode).join(" | ") + " |";
-
-      case "tableCell":
-      case "tableHeader": {
-        // Join multiple block children with a space (not "") so adjacent blocks
-        // like a paragraph followed by a list don't collide into "line1- a".
-        // Then collapse newlines and escape pipes so a cell containing "|" or a
-        // line break cannot corrupt the surrounding GFM row.
-        return nodeContent
-          .map(processNode)
-          .join(" ")
-          .replace(/\r?\n/g, " ")
-          .replace(/\|/g, "\\|");
-      }
-
-      case "callout":
-        const calloutType = node.attrs?.type || "info";
-        const calloutContent = nodeContent.map(processNode).join("\n");
-        return `:::${calloutType.toLowerCase()}\n${calloutContent}\n:::`;
-
-      case "details":
-        return nodeContent.map(processNode).join("\n");
-
-      case "detailsSummary":
-        const summaryText = nodeContent.map(processNode).join("");
-        return `<details>\n<summary>${summaryText}</summary>\n`;
-
-      case "detailsContent":
-        const detailsText = nodeContent.map(processNode).join("\n");
-        return `${detailsText}\n</details>`;
-
-      case "mathInline": {
-        // The schema's `text` attribute has no parseHTML, so TipTap's default
-        // parser reads it from the `text` HTML attribute (NOT the element's text
-        // content). Emit span[data-type="mathInline"] carrying the LaTeX in a
-        // `text="..."` attribute so it round-trips. marked cannot parse $...$
-        // back, so the previous form was lossy.
-        const inlineMath = node.attrs?.text || "";
-        return `<span data-type="mathInline" data-katex="true" text="${escapeAttr(inlineMath)}"></span>`;
-      }
-
-      case "mathBlock": {
-        // Same as mathInline: the LaTeX must ride in the `text` HTML attribute
-        // for the schema's default parser to recover it.
-        const blockMath = node.attrs?.text || "";
-        return `<div data-type="mathBlock" data-katex="true" text="${escapeAttr(blockMath)}"></div>`;
-      }
-
-      case "mention": {
-        // Emit span[data-type="mention"] with the schema's data-* attributes so
-        // generateJSON rebuilds the mention node instead of leaving "@label"
-        // plain text that cannot re-parse.
-        const attrs = node.attrs || {};
-        const parts: string[] = [`data-type="mention"`];
-        if (attrs.id) parts.push(`data-id="${escapeAttr(attrs.id)}"`);
-        if (attrs.label)
-          parts.push(`data-label="${escapeAttr(attrs.label)}"`);
-        if (attrs.entityType)
-          parts.push(`data-entity-type="${escapeAttr(attrs.entityType)}"`);
-        if (attrs.entityId)
-          parts.push(`data-entity-id="${escapeAttr(attrs.entityId)}"`);
-        if (attrs.slugId)
-          parts.push(`data-slug-id="${escapeAttr(attrs.slugId)}"`);
-        if (attrs.creatorId)
-          parts.push(`data-creator-id="${escapeAttr(attrs.creatorId)}"`);
-        if (attrs.anchorId)
-          parts.push(`data-anchor-id="${escapeAttr(attrs.anchorId)}"`);
-        // Keep the label as visible text content too; the schema reads attrs
-        // from data-*, so the inner text is purely cosmetic and harmless.
-        const mentionLabel = attrs.label || attrs.id || "";
-        // The label is visible element TEXT content here (the data-* attrs above
-        // carry the real values), so escape it for the text context, not attrs.
-        return `<span ${parts.join(" ")}>@${escapeHtmlText(mentionLabel)}</span>`;
-      }
-
-      case "footnoteReference": {
-        // Pandoc/GFM inline marker. The number is derived (not stored), so the
-        // id is the stable anchor.
-        const fnId = node.attrs?.id || "";
-        return fnId ? `[^${fnId}]` : "";
-      }
-
-      case "footnotesList":
-        // The container renders its definitions, each on its own `[^id]: ...`
-        // line. A blank line separates the body from the notes block.
-        return nodeContent.map(processNode).join("\n");
-
-      case "footnoteDefinition": {
-        const defId = node.attrs?.id || "";
-        // Collapse the definition's paragraphs into a single line; multi-line
-        // footnotes are a v2 refinement.
-        const defText = nodeContent
-          .map(processNode)
-          .join(" ")
-          .replace(/\s*\n+\s*/g, " ")
-          .trim();
-        return defId ? `[^${defId}]: ${defText}` : "";
-      }
-
-      case "attachment": {
-        // BUG FIX: the old code read node.attrs.fileName / node.attrs.src, but
-        // the schema stores name/url (plus mime/size/attachmentId). Emit the
-        // schema-matching div[data-type="attachment"] with data-attachment-*
-        // attrs so the node round-trips instead of degrading to a markdown link.
-        const attrs = node.attrs || {};
-        const parts: string[] = [
-          `data-type="attachment"`,
-          `data-attachment-url="${escapeAttr(attrs.url ?? "")}"`,
-        ];
-        if (attrs.name)
-          parts.push(`data-attachment-name="${escapeAttr(attrs.name)}"`);
-        if (attrs.mime)
-          parts.push(`data-attachment-mime="${escapeAttr(attrs.mime)}"`);
-        if (attrs.size != null)
-          parts.push(`data-attachment-size="${escapeAttr(attrs.size)}"`);
-        if (attrs.attachmentId)
-          parts.push(
-            `data-attachment-id="${escapeAttr(attrs.attachmentId)}"`,
-          );
-        return `<div ${parts.join(" ")}></div>`;
-      }
-
-      case "drawio":
-      case "excalidraw": {
-        // Emit the schema-matching div[data-type=...] carrying the diagram's
-        // attrs as data-* (the schema's diagramAttributes reads src/title/alt/
-        // width/height/size/aspectRatio/align/attachmentId from data-*), so the
-        // diagram round-trips instead of degrading to a lossy placeholder.
-        const attrs = node.attrs || {};
-        const parts: string[] = [
-          `data-type="${type}"`,
-          `data-src="${escapeAttr(attrs.src ?? "")}"`,
-        ];
-        if (attrs.title != null)
-          parts.push(`data-title="${escapeAttr(attrs.title)}"`);
-        if (attrs.alt != null) parts.push(`data-alt="${escapeAttr(attrs.alt)}"`);
-        if (attrs.width != null)
-          parts.push(`data-width="${escapeAttr(attrs.width)}"`);
-        if (attrs.height != null)
-          parts.push(`data-height="${escapeAttr(attrs.height)}"`);
-        if (attrs.size != null)
-          parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-        if (attrs.aspectRatio != null)
-          parts.push(`data-aspect-ratio="${escapeAttr(attrs.aspectRatio)}"`);
-        if (attrs.align)
-          parts.push(`data-align="${escapeAttr(attrs.align)}"`);
-        if (attrs.attachmentId)
-          parts.push(
-            `data-attachment-id="${escapeAttr(attrs.attachmentId)}"`,
-          );
-        return `<div ${parts.join(" ")}></div>`;
-      }
-
-      case "embed": {
-        // Emit the schema-matching div[data-type="embed"]; the schema reads
-        // src/provider/align/width/height from data-* attributes so the node
-        // (and its provider iframe info) survives the round-trip.
-        const attrs = node.attrs || {};
-        const parts: string[] = [
-          `data-type="embed"`,
-          `data-src="${escapeAttr(attrs.src ?? "")}"`,
-          `data-provider="${escapeAttr(attrs.provider ?? "")}"`,
-        ];
-        if (attrs.align)
-          parts.push(`data-align="${escapeAttr(attrs.align)}"`);
-        if (attrs.width != null)
-          parts.push(`data-width="${escapeAttr(attrs.width)}"`);
-        if (attrs.height != null)
-          parts.push(`data-height="${escapeAttr(attrs.height)}"`);
-        return `<div ${parts.join(" ")}></div>`;
-      }
-
-      case "audio": {
-        // Emit the schema-matching <audio> element (was emitting nothing). The
-        // schema reads src from src and attachmentId/size from data-*.
-        const attrs = node.attrs || {};
-        const parts: string[] = [`src="${escapeAttr(attrs.src ?? "")}"`];
-        if (attrs.attachmentId)
-          parts.push(
-            `data-attachment-id="${escapeAttr(attrs.attachmentId)}"`,
-          );
-        if (attrs.size != null)
-          parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-        // Wrap in a block <div> for the same reason as video: a bare <audio> is
-        // inline-level HTML that marked would wrap in <p>.
-        return `<div><audio ${parts.join(" ")}></audio></div>`;
-      }
-
-      case "pdf": {
-        // Emit the schema-matching div[data-type="pdf"] (was emitting nothing).
-        // The schema reads src/width/height from standard attrs and name/
-        // attachmentId/size from data-*.
-        const attrs = node.attrs || {};
-        const parts: string[] = [
-          `data-type="pdf"`,
-          `src="${escapeAttr(attrs.src ?? "")}"`,
-        ];
-        if (attrs.name) parts.push(`data-name="${escapeAttr(attrs.name)}"`);
-        if (attrs.attachmentId)
-          parts.push(
-            `data-attachment-id="${escapeAttr(attrs.attachmentId)}"`,
-          );
-        if (attrs.size != null)
-          parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-        if (attrs.width != null)
-          parts.push(`width="${escapeAttr(attrs.width)}"`);
-        if (attrs.height != null)
-          parts.push(`height="${escapeAttr(attrs.height)}"`);
-        return `<div ${parts.join(" ")}></div>`;
-      }
-
-      case "columns": {
-        // Emit the schema-matching div[data-type="columns"] wrapper so the
-        // multi-column layout survives. Without a case the children were
-        // concatenated with no separator and the text merged. The schema reads
-        // layout from data-layout and widthMode from data-width-mode. The whole
-        // block is raw HTML, so render children via blockToHtml (NOT markdown,
-        // which marked would not re-parse inside a raw HTML block).
-        const attrs = node.attrs || {};
-        const parts: string[] = [`data-type="columns"`];
-        if (attrs.layout)
-          parts.push(`data-layout="${escapeAttr(attrs.layout)}"`);
-        if (attrs.widthMode && attrs.widthMode !== "normal")
-          parts.push(`data-width-mode="${escapeAttr(attrs.widthMode)}"`);
-        const inner = nodeContent.map((n: any) => blockToHtml(n)).join("");
-        return `<div ${parts.join(" ")}>${inner}</div>`;
-      }
-
-      case "column": {
-        // Emit the schema-matching div[data-type="column"]; the schema reads the
-        // column width from data-width. Children are rendered as HTML so their
-        // formatting survives inside this raw HTML block.
-        const attrs = node.attrs || {};
-        const parts: string[] = [`data-type="column"`];
-        if (attrs.width)
-          parts.push(`data-width="${escapeAttr(attrs.width)}"`);
-        const inner = nodeContent.map((n: any) => blockToHtml(n)).join("");
-        return `<div ${parts.join(" ")}>${inner}</div>`;
-      }
-
-      case "subpages":
-        return "{{SUBPAGES}}";
-
-      default:
-        // Fallback: process children
-        return nodeContent.map(processNode).join("");
-    }
-  };
-
-  // Render inline content (text runs + their marks) to HTML. Used by the raw
-  // HTML fallbacks (spanned tables, columns) where marked will NOT re-parse
-  // markdown, so backtick/asterisk/bracket syntax would otherwise leak as
-  // literal characters. Each mark is mirrored to the HTML the schema's parseHTML
-  // accepts so it re-imports as the matching ProseMirror mark.
-  const inlineToHtml = (inlineNodes: any[]): string =>
-    (inlineNodes || [])
-      .map((n: any) => {
-        if (n.type === "hardBreak") return "<br>";
-        if (n.type !== "text") {
-          // Inline atoms (mention, mathInline) already emit schema HTML.
-          return processNode(n);
-        }
-        let t = escapeHtmlText(n.text || "");
-        for (const mark of n.marks || []) {
-          switch (mark.type) {
-            case "bold":
-              t = `<strong>${t}</strong>`;
-              break;
-            case "italic":
-              t = `<em>${t}</em>`;
-              break;
-            case "code":
-              t = `<code>${t}</code>`;
-              break;
-            case "strike":
-              t = `<s>${t}</s>`;
-              break;
-            case "underline":
-              t = `<u>${t}</u>`;
-              break;
-            case "subscript":
-              t = `<sub>${t}</sub>`;
-              break;
-            case "superscript":
-              t = `<sup>${t}</sup>`;
-              break;
-            case "link":
-              t = `<a href="${escapeAttr(mark.attrs?.href || "")}">${t}</a>`;
-              break;
-            case "highlight":
-              t = mark.attrs?.color
-                ? `<mark style="background-color: ${escapeAttr(mark.attrs.color)}">${t}</mark>`
-                : `<mark>${t}</mark>`;
-              break;
-            case "textStyle":
-              if (mark.attrs?.color)
-                t = `<span style="color: ${escapeAttr(mark.attrs.color)}">${t}</span>`;
-              break;
-            case "comment":
-              // Inline comment anchor inside a raw-HTML container (columns /
-              // spanned table cells), so commented text there also round-trips.
-              if (mark.attrs?.commentId) {
-                const r = mark.attrs?.resolved ? ` data-resolved="true"` : "";
-                t = `<span data-comment-id="${escapeAttr(mark.attrs.commentId)}"${r}>${t}</span>`;
-              }
-              break;
-          }
-        }
-        return t;
-      })
-      .join("");
-
-  // Emit the schema-matching <img> for an image node. Shared so the image is
-  // emitted as real HTML wherever a raw-HTML container needs it (inside a column
-  // or a spanned table cell), where markdown `![](...)` would NOT be re-parsed
-  // and would survive as literal text. The Image extension reads src/alt from
-  // the standard attributes; the Docmost extra attrs (width/height/align/size/
-  // attachmentId/aspectRatio) are global attributes read from same-named DOM
-  // attributes, so emit them by name.
-  const imageToHtml = (node: any): string => {
-    const attrs = node.attrs || {};
-    const parts: string[] = [`src="${escapeAttr(attrs.src ?? "")}"`];
-    if (attrs.alt) parts.push(`alt="${escapeAttr(attrs.alt)}"`);
-    if (attrs.caption)
-      parts.push(`data-caption="${escapeAttr(attrs.caption)}"`);
-    if (attrs.title) parts.push(`title="${escapeAttr(attrs.title)}"`);
-    if (attrs.width != null) parts.push(`width="${escapeAttr(attrs.width)}"`);
-    if (attrs.height != null) parts.push(`height="${escapeAttr(attrs.height)}"`);
-    if (attrs.align) parts.push(`align="${escapeAttr(attrs.align)}"`);
-    if (attrs.size != null) parts.push(`data-size="${escapeAttr(attrs.size)}"`);
-    if (attrs.attachmentId)
-      parts.push(`data-attachment-id="${escapeAttr(attrs.attachmentId)}"`);
-    if (attrs.aspectRatio != null)
-      parts.push(`data-aspect-ratio="${escapeAttr(attrs.aspectRatio)}"`);
-    return `<img ${parts.join(" ")}>`;
-  };
-
-  // Emit the schema-matching div[data-type="callout"] for a callout node. The
-  // schema reads the banner type from data-callout-type. Children are rendered
-  // as HTML so they survive inside a raw-HTML container.
-  const calloutToHtml = (node: any): string => {
-    const type = (node.attrs?.type || "info").toLowerCase();
-    const inner = (node.content || []).map(blockToHtml).join("");
-    return `<div data-type="callout" data-callout-type="${escapeAttr(type)}">${inner}</div>`;
-  };
-
-  // Emit a schema-matching <details> tree. The schema parses <details>,
-  // summary[data-type="detailsSummary"], and div[data-type="detailsContent"].
-  const detailsToHtml = (node: any): string => {
-    const inner = (node.content || []).map(blockToHtml).join("");
-    return `<details>${inner}</details>`;
-  };
-  const detailsSummaryToHtml = (node: any): string =>
-    `<summary data-type="detailsSummary">${inlineToHtml(node.content || [])}</summary>`;
-  const detailsContentToHtml = (node: any): string => {
-    const inner = (node.content || []).map(blockToHtml).join("");
-    return `<div data-type="detailsContent">${inner}</div>`;
-  };
-
-  // Emit the schema-matching taskList/taskItem HTML. bridgeTaskLists (in
-  // collaboration.ts) recognizes ul[data-type="taskList"] with
-  // li[data-type="taskItem"][data-checked]; emitting that directly here keeps
-  // task lists inside columns/cells from degrading to literal "- [ ]" text.
-  const taskListToHtml = (node: any): string => {
-    const items = (node.content || [])
-      .map((it: any) => {
-        const checked = it.attrs?.checked ? "true" : "false";
-        return `<li data-type="taskItem" data-checked="${checked}">${blockChildrenToHtml(it)}</li>`;
-      })
-      .join("");
-    return `<ul data-type="taskList">${items}</ul>`;
-  };
-
-  // Render a block node to HTML for the raw-HTML containers (spanned tables,
-  // columns). marked does NOT re-parse markdown inside a raw-HTML block, so
-  // EVERY block type that can appear inside a column or a spanned cell must be
-  // emitted as schema-matching HTML here — never as markdown, or it would land
-  // as literal text on re-import. Nodes whose processNode case already produces
-  // schema-matching HTML (math/media/embed/attachment/nested columns/spanned
-  // table) are delegated to processNode; the markdown-emitting cases
-  // (image/blockquote/callout/details/hr/taskList) get explicit HTML here.
-  const blockToHtml = (block: any): string => {
-    const children = block.content || [];
-    switch (block.type) {
-      case "paragraph":
-        return `<p>${inlineToHtml(children)}</p>`;
-      case "heading": {
-        const level = block.attrs?.level || 1;
-        return `<h${level}>${inlineToHtml(children)}</h${level}>`;
-      }
-      case "bulletList":
-        return `<ul>${children
-          .map((li: any) => `<li>${blockChildrenToHtml(li)}</li>`)
-          .join("")}</ul>`;
-      case "orderedList":
-        return `<ol>${children
-          .map((li: any) => `<li>${blockChildrenToHtml(li)}</li>`)
-          .join("")}</ol>`;
-      case "codeBlock": {
-        const lang = block.attrs?.language || "";
-        // The code itself is element TEXT content (between <code> tags), so it
-        // must escape < > & — NOT the attribute escaper. The language rides in
-        // a class ATTRIBUTE, so it uses escapeAttr.
-        const code = escapeHtmlText(
-          children
-            .map(processNode)
-            .join("")
-            .replace(/\n+$/, ""),
-        );
-        const cls = lang ? ` class="language-${escapeAttr(lang)}"` : "";
-        return `<pre><code${cls}>${code}</code></pre>`;
-      }
-      case "image":
-        return imageToHtml(block);
-      case "blockquote":
-        return `<blockquote>${children.map(blockToHtml).join("")}</blockquote>`;
-      case "horizontalRule":
-        return "<hr>";
-      case "callout":
-        return calloutToHtml(block);
-      case "details":
-        return detailsToHtml(block);
-      case "detailsSummary":
-        return detailsSummaryToHtml(block);
-      case "detailsContent":
-        return detailsContentToHtml(block);
-      case "taskList":
-        return taskListToHtml(block);
-      case "taskItem":
-        // A bare taskItem (outside a taskList) still needs a wrapping list so
-        // the schema parses it; wrap it in a single-item taskList.
-        return taskListToHtml({ content: [block] });
-      // table (incl. spanned), columns/column, math, media, embed, attachment,
-      // mention, etc. already emit schema-matching HTML from processNode.
-      case "table":
-      case "columns":
-      case "column":
-      case "mathBlock":
-      case "video":
-      case "audio":
-      case "pdf":
-      case "youtube":
-      case "embed":
-      case "attachment":
-      case "drawio":
-      case "excalidraw":
-        return processNode(block);
-      default:
-        // Any still-unhandled block type: NEVER fall back to markdown inside a
-        // raw-HTML block (it would become literal text). Wrap its rendered
-        // children in a <div> so their content is preserved; if it has no block
-        // children, render its inline content instead.
-        if (children.length && children.some((c: any) => c.type !== "text")) {
-          return `<div>${children.map(blockToHtml).join("")}</div>`;
-        }
-        return `<div>${inlineToHtml(children)}</div>`;
-    }
-  };
-
-  // Render the block children of a list item to HTML (a listItem holds block+
-  // content). Mirrors processListItem but for the HTML fallback path.
-  const blockChildrenToHtml = (item: any): string =>
-    (item.content || []).map((b: any) => blockToHtml(b)).join("");
-
-  // Indent the rendered children of a list item under a marker prefix.
-  // Each child block is a (possibly multi-line) string. The very first physical
-  // line of the first child carries the marker (e.g. "- " or "1. "); EVERY
-  // other line — the remaining lines of the first child AND all lines of every
-  // subsequent child (nested lists, code blocks, extra paragraphs) — is indented
-  // to align under the marker. Without indenting these continuation lines, the
-  // 2nd/3rd line of a nested child collapses to column 0 and escapes the list.
-  //
-  // The continuation indent MUST equal the LIST marker width, which is not the
-  // same as the visible prefix width:
-  //   - bullet "- "          -> 2 columns
-  //   - task   "- [ ] "      -> marker is still "- " (the "[ ] " is content), 2
-  //   - ordered "1. "/"10. " -> 3/4 columns, scaling with the number's digits
-  // CommonMark anchors nested content to the marker column, so an ordered item
-  // indented to only 2 columns would be re-parsed as a sibling/loose content on
-  // re-import. Callers therefore pass the exact indent width to use.
-  const indentItemChildren = (
-    childStrings: string[],
-    prefix: string,
-    indentWidth: number,
-  ): string => {
-    const indent = " ".repeat(indentWidth);
-    const lines: string[] = [];
-    childStrings.forEach((child, childIndex) => {
-      child.split("\n").forEach((line, lineIndex) => {
-        if (childIndex === 0 && lineIndex === 0) {
-          // First physical line of the first block gets the marker.
-          lines.push(`${prefix} ${line}`);
-        } else {
-          // Indent every continuation line by the marker width; keep blank
-          // lines blank rather than emitting trailing whitespace.
-          lines.push(line.length ? `${indent}${line}` : "");
-        }
-      });
-    });
-    return lines.join("\n");
-  };
-
-  const processListItem = (item: any, prefix: string): string => {
-    const itemContent = item.content || [];
-    const childStrings = itemContent.map(processNode);
-    if (childStrings.length === 0) return prefix;
-    // The rendered marker is `${prefix} ` (prefix + one space), so its width —
-    // and thus the continuation indent — is prefix.length + 1. This is correct
-    // for both bullet ("-" -> 2) and ordered ("1." -> 3, "10." -> 4) markers,
-    // since for those the visible prefix IS the list marker.
-    return indentItemChildren(childStrings, prefix, prefix.length + 1);
-  };
-
-  const processTaskItem = (item: any): string => {
-    const checked = item.attrs?.checked || false;
-    const checkbox = checked ? "[x]" : "[ ]";
-    const prefix = `- ${checkbox}`;
-    const itemContent = item.content || [];
-    const childStrings = itemContent.map(processNode);
-    // An empty task item still needs its checkbox marker; without this guard
-    // the indent below produces "" and the "- [ ]"/"- [x]" row disappears.
-    if (childStrings.length === 0) return prefix;
-    // The list marker for a task item is just "- " (2 columns); the "[ ] "/"[x] "
-    // checkbox is item content, NOT part of the marker. So the continuation
-    // indent is a fixed 2 — do NOT derive it from the wider prefix.length.
-    return indentItemChildren(childStrings, prefix, 2);
-  };
-
-  return processNode(content).trim();
-}
+export {
+  convertProseMirrorToMarkdown,
+  type ConvertProseMirrorToMarkdownOptions,
+} from "@docmost/prosemirror-markdown";
diff --git a/packages/mcp/src/lib/markdown-document.ts b/packages/mcp/src/lib/markdown-document.ts
index b6bb004f..c744e117 100644
--- a/packages/mcp/src/lib/markdown-document.ts
+++ b/packages/mcp/src/lib/markdown-document.ts
@@ -1,136 +1,15 @@
 /**
- * Self-contained Docmost-flavoured Markdown document (custom extensions).
+ * Self-contained Docmost-flavoured Markdown document envelope (`docmost:meta` /
+ * `docmost:comments` blocks).
  *
- * A single `.md` file that packages everything needed to losslessly round-trip
- * a page through "download -> edit body -> re-upload":
- *   - a leading `docmost:meta` block: a one-line JSON object with page identity;
- *   - the Markdown body (carrying inline comment anchors and diagrams as HTML);
- *   - a trailing `docmost:comments` block: a one-line JSON array of comment
- *     threads.
- *
- * Both metadata blocks are HTML comments on purpose: `marked`/`generateJSON`
- * drop HTML comments, so even if the WHOLE file were ever fed straight to the
- * importer without first stripping the blocks, the metadata cannot leak into the
- * document. (A fenced ```docmost-comments``` block would WRONGLY become a
- * codeBlock node, so a fenced block is deliberately NOT used.)
- *
- * The delimiter literals may legitimately appear in the BODY too (e.g. a user
- * re-pastes an exported `.md` into a page, or a page documents this very
- * format). To stay robust, parsing treats only the FINAL, document-ending
- * `docmost:comments` block as metadata: it is the last `<!-- docmost:comments`
- * opener whose closing `-->` sits at the very end of the file. Any earlier
- * literal occurrence is left in the body untouched.
- *
- * NOTE on comments: in this version the comment THREAD records are preserved in
- * the file but are NOT pushed back to the server on import — only the inline
- * comment marks (anchors) embedded in the body are restored. Managing comment
- * records stays with the comment tools/UI.
+ * #293 STEP 5: this envelope is now owned by the shared
+ * `@docmost/prosemirror-markdown` package (the mcp copy was byte-identical to
+ * the package's, so re-exporting is lossless). Kept as a thin shim so the
+ * existing `./markdown-document.js` importers (client.ts, tests) do not move.
  */
-
-export interface DocmostMdMeta {
-  version: number;
-  pageId?: string;
-  slugId?: string;
-  title?: string;
-  spaceId?: string;
-  parentPageId?: string | null;
-}
-
-// Match the leading meta block (allow leading whitespace). Capture group 1 is
-// the JSON text between the markers.
-const META_RE = /^\s*<!--\s*docmost:meta\s*\n([\s\S]*?)\n-->/;
-// Match a `docmost:comments` opener. Used globally to scan for the LAST opener
-// rather than end-anchoring a single regex (which would mis-capture across a
-// literal opener that appears earlier in the body).
-const COMMENTS_OPEN_RE = /<!--[ \t]*docmost:comments[ \t]*\r?\n/g;
-
-/**
- * Assemble the full self-contained markdown file: meta block, body, and the
- * comments block. The meta block is always emitted; the comments block is always
- * emitted too (with `[]` when there are no comments) so the format stays uniform
- * and parsing stays simple.
- */
-export function serializeDocmostMarkdown(
-  meta: DocmostMdMeta,
-  body: string,
-  comments: any[],
-): string {
-  const metaJson = JSON.stringify(meta);
-  const commentsJson = JSON.stringify(Array.isArray(comments) ? comments : []);
-  const trimmedBody = (body ?? "").trim();
-  return (
-    `<!-- docmost:meta\n${metaJson}\n-->\n\n` +
-    `${trimmedBody}\n\n` +
-    `<!-- docmost:comments\n${commentsJson}\n-->\n`
-  );
-}
-
-/**
- * Split a self-contained file back into its parts. Tolerant: if the meta or
- * comments block is missing (e.g. a hand-written plain-markdown file), the
- * corresponding value is returned as `null` and the whole input is treated as
- * the body. This never throws on a MISSING block; only a `JSON.parse` failure
- * inside a block that IS present is surfaced as a thrown Error with a clear
- * message. Robust to `\r\n` line endings.
- */
-export function parseDocmostMarkdown(full: string): {
-  meta: DocmostMdMeta | null;
-  body: string;
-  comments: any[] | null;
-} {
-  // Normalize line endings so the anchored regexes work regardless of CRLF.
-  const normalized = (full ?? "").replace(/\r\n/g, "\n");
-
-  // Extract the leading meta block (start-anchored — already unambiguous).
-  let meta: DocmostMdMeta | null = null;
-  let metaEnd = 0;
-  const metaMatch = normalized.match(META_RE);
-  if (metaMatch) {
-    try {
-      meta = JSON.parse(metaMatch[1]);
-    } catch (e) {
-      throw new Error(
-        `Invalid docmost:meta JSON block: ${
-          e instanceof Error ? e.message : String(e)
-        }`,
-      );
-    }
-    // Body starts right after the matched meta block.
-    metaEnd = (metaMatch.index ?? 0) + metaMatch[0].length;
-  }
-
-  // Find the LAST `<!-- docmost:comments` opener; the real file-level block is
-  // the final one whose closing `-->` ends the document. Any earlier literal
-  // occurrence inside the body (e.g. a re-pasted export) is left in the body.
-  let lastOpenStart = -1;
-  let lastOpenEnd = -1;
-  let m: RegExpExecArray | null;
-  COMMENTS_OPEN_RE.lastIndex = 0;
-  while ((m = COMMENTS_OPEN_RE.exec(normalized)) !== null) {
-    lastOpenStart = m.index;
-    lastOpenEnd = m.index + m[0].length;
-  }
-
-  let comments: any[] | null = null;
-  let bodyEnd = normalized.length;
-  if (lastOpenStart !== -1) {
-    const rest = normalized.slice(lastOpenEnd);
-    const close = rest.match(/\r?\n-->[ \t]*\r?\n?\s*$/); // closer must end the doc
-    if (close) {
-      const jsonText = rest.slice(0, close.index);
-      try {
-        comments = JSON.parse(jsonText);
-      } catch (e) {
-        throw new Error(
-          `Invalid docmost:comments JSON block: ${
-            e instanceof Error ? e.message : String(e)
-          }`,
-        );
-      }
-      bodyEnd = lastOpenStart; // strip from the opener to end of document
-    }
-  }
-
-  const body = normalized.slice(metaEnd, bodyEnd).trim();
-  return { meta, body, comments };
-}
+export {
+  serializeDocmostMarkdown,
+  parseDocmostMarkdown,
+  serializeDocmostMarkdownBody,
+} from "@docmost/prosemirror-markdown";
+export type { DocmostMdMeta } from "@docmost/prosemirror-markdown";
diff --git a/packages/mcp/test-e2e.mjs b/packages/mcp/test-e2e.mjs
index 7d3d78bb..6fa6192b 100644
--- a/packages/mcp/test-e2e.mjs
+++ b/packages/mcp/test-e2e.mjs
@@ -462,7 +462,7 @@ async function main() {
     check("create_comment: markdown round-trip", c1.data.content.includes("**комментарий**"), c1.data.content);
     const reply = await client.createComment(pageId, "Ответ на комментарий.", "page", undefined, c1.data.id);
     check("create_comment: reply has parent", reply.data.parentCommentId === c1.data.id);
-    const list = await client.listComments(pageId);
+    const list = (await client.listComments(pageId)).items;
     check("list_comments: both visible", list.length === 2, `count=${list.length}`);
     await client.updateComment(c1.data.id, "Обновлённый текст комментария.");
     const got = await client.getComment(c1.data.id);
@@ -472,17 +472,19 @@ async function main() {
     // resolve_comment: close the top-level thread, verify resolvedAt surfaces, then reopen
     const resolvedRes = await client.resolveComment(c1.data.id, true);
     check("resolve_comment: marks resolved", resolvedRes.success === true && resolvedRes.resolved === true);
-    const listResolved = await client.listComments(pageId);
+    // c1 is now resolved; the default feed hides resolved threads, so pass
+    // includeResolved:true to still see it and assert its resolvedAt (#328).
+    const listResolved = (await client.listComments(pageId, true)).items;
     const c1Resolved = listResolved.find((c) => c.id === c1.data.id);
     check("resolve_comment: resolvedAt set in list", !!c1Resolved?.resolvedAt, `resolvedAt=${c1Resolved?.resolvedAt}`);
     const reopenedRes = await client.resolveComment(c1.data.id, false);
     check("resolve_comment: reopen succeeds", reopenedRes.resolved === false);
-    const listReopened = await client.listComments(pageId);
+    const listReopened = (await client.listComments(pageId)).items;
     const c1Reopened = listReopened.find((c) => c.id === c1.data.id);
     check("resolve_comment: resolvedAt cleared on reopen", !c1Reopened?.resolvedAt, `resolvedAt=${c1Reopened?.resolvedAt}`);
     await client.deleteComment(reply.data.id);
     await client.deleteComment(c1.data.id);
-    const listAfter = await client.listComments(pageId);
+    const listAfter = (await client.listComments(pageId)).items;
     check("delete_comment: comments removed", listAfter.length === 0, `count=${listAfter.length}`);
   } finally {
     if (pageId) {
diff --git a/packages/mcp/test/mock/list-comments-resolved.test.mjs b/packages/mcp/test/mock/list-comments-resolved.test.mjs
new file mode 100644
index 00000000..19188b9e
--- /dev/null
+++ b/packages/mcp/test/mock/list-comments-resolved.test.mjs
@@ -0,0 +1,160 @@
+// gitmost #328 Channel 2: DocmostClient.listComments hides RESOLVED THREADS
+// wholesale by default (a resolved top-level comment AND every reply under it),
+// returning `{ items, resolvedThreadsHidden }`. `includeResolved: true` returns
+// the full feed. These tests stand a local http.createServer in for Docmost and
+// mock the /auth/login + /comments (paginated) routes.
+import { test, after } from "node:test";
+import assert from "node:assert/strict";
+import http from "node:http";
+import { DocmostClient } from "../../build/client.js";
+
+// Drain `req` and resolve with its entire payload as a single string once
+// the stream emits "end".
+function readBody(req) {
+  const chunks = [];
+  req.on("data", (chunk) => chunks.push(chunk));
+  return new Promise((done) => req.on("end", () => done(chunks.join(""))));
+}
+
+// Serve `handler` on an ephemeral loopback port; resolves { server, baseURL }.
+function startServer(handler) {
+  const server = http.createServer(handler);
+  return new Promise((ready) => {
+    server.listen(0, "127.0.0.1", () => {
+      ready({ server, baseURL: `http://127.0.0.1:${server.address().port}/api` });
+    });
+  });
+}
+
+function closeServer(server) {
+  return new Promise((done) => server.close(done)); // settles via close()'s callback
+}
+
+function sendJson(res, status, obj, extraHeaders = {}) {
+  const headers = { "Content-Type": "application/json", ...extraHeaders };
+  res.writeHead(status, headers).end(JSON.stringify(obj)); // writeHead returns res
+}
+
+const openServers = []; // every server started by spawn(); closed in after()
+async function spawn(handler) {
+  const started = await startServer(handler);
+  openServers.push(started.server);
+  return { server: started.server, baseURL: started.baseURL };
+}
+
+after(async () => {
+  await Promise.all(openServers.map((s) => closeServer(s)));
+});
+
+// A minimal ProseMirror comment body (a paragraph of text).
+const body = (t) => {
+  const paragraph = { type: "paragraph", content: [{ type: "text", text: t }] };
+  return { type: "doc", content: [paragraph] };
+};
+
+// Feed: an ACTIVE thread whose REPLY is resolved (root active, reply resolved —
+// the thread must STAY, because a thread is gated only by its ROOT's resolvedAt)
+// and a RESOLVED thread (root + reply).
+const FEED = [
+  {
+    id: "a",
+    pageId: "page-1",
+    parentCommentId: null,
+    resolvedAt: null,
+    createdAt: "2026-01-01T00:00:00.000Z",
+    creatorId: "u1",
+    content: body("active root"),
+  },
+  {
+    id: "a1",
+    pageId: "page-1",
+    parentCommentId: "a",
+    // A RESOLVED reply under an ACTIVE root: the thread is NOT hidden (only a
+    // resolved ROOT hides a thread), so this reply survives the default filter.
+    resolvedAt: "2026-02-15T00:00:00.000Z",
+    createdAt: "2026-01-01T01:00:00.000Z",
+    creatorId: "u1",
+    content: body("resolved reply of an active thread"),
+  },
+  {
+    id: "r",
+    pageId: "page-1",
+    parentCommentId: null,
+    resolvedAt: "2026-02-01T00:00:00.000Z",
+    createdAt: "2026-01-02T00:00:00.000Z",
+    creatorId: "u1",
+    content: body("resolved root"),
+  },
+  {
+    id: "r1",
+    pageId: "page-1",
+    parentCommentId: "r",
+    resolvedAt: null,
+    createdAt: "2026-01-02T01:00:00.000Z",
+    creatorId: "u1",
+    content: body("resolved reply"),
+  },
+];
+
+// Mock Docmost: a login route that sets the auth cookie, a one-page /comments
+// feed (FEED), and a JSON 404 for any other URL.
+function commentsServer() {
+  return spawn(async (req, res) => {
+    await readBody(req);
+    switch (req.url) {
+      case "/api/auth/login": {
+        const cookie = { "Set-Cookie": "authToken=t; Path=/; HttpOnly" };
+        return sendJson(res, 200, { success: true }, cookie);
+      }
+      case "/api/comments": // single page: nextCursor is null
+        return sendJson(res, 200, { data: { items: FEED, meta: { nextCursor: null } } });
+      default:
+        return sendJson(res, 404, { message: "not found" });
+    }
+  });
+}
+
+test("default hides the resolved thread (root + its reply) and counts it", async () => {
+  // Default call (no second argument) against the mocked FEED.
+  const mock = await commentsServer();
+  const docmost = new DocmostClient(mock.baseURL, "user@example.com", "pw");
+  const { items, resolvedThreadsHidden } = await docmost.listComments("page-1");
+  assert.equal(Array.isArray(items), true, "returns { items, ... }");
+  const seen = items.map((comment) => comment.id).sort();
+  assert.deepEqual(seen, ["a", "a1"], "only the active thread remains");
+  assert.equal(resolvedThreadsHidden, 1, "one resolved thread hidden");
+});
+
+test("includeResolved:true returns EVERYTHING with zero hidden", async () => {
+  const mock = await commentsServer();
+  const docmost = new DocmostClient(mock.baseURL, "user@example.com", "pw");
+  // Passing `true` as the second argument asks for the unfiltered feed.
+  const { items, resolvedThreadsHidden } = await docmost.listComments("page-1", true);
+  const seen = items.map((comment) => comment.id).sort();
+  assert.deepEqual(seen, ["a", "a1", "r", "r1"], "all four comments returned");
+  assert.equal(resolvedThreadsHidden, 0, "nothing hidden with the flag");
+});
+
+test("the reply of a resolved thread is hidden with the thread", async () => {
+  const mock = await commentsServer();
+  const docmost = new DocmostClient(mock.baseURL, "user@example.com", "pw");
+  const { items } = await docmost.listComments("page-1");
+  // In FEED, `r` is the resolved root and `r1` is the reply filed under it.
+  const seen = new Set(items.map((comment) => comment.id));
+  assert.equal(seen.has("r1"), false, "the resolved thread's reply is gone");
+  assert.equal(seen.has("r"), false, "the resolved root is gone");
+});
+
+test("an ACTIVE thread whose REPLY is resolved is NOT hidden", async () => {
+  // Only the ROOT's resolvedAt decides whether a thread is hidden. In FEED,
+  // `a1` is resolved but sits under the unresolved root `a`, so both ids must
+  // be returned and the hidden count must cover just the `r` thread.
+  const mock = await commentsServer();
+  const docmost = new DocmostClient(mock.baseURL, "user@example.com", "pw");
+  const { items, resolvedThreadsHidden } = await docmost.listComments("page-1");
+
+  const seen = items.map((comment) => comment.id);
+  assert.equal(seen.includes("a"), true, "active root stays");
+  assert.equal(seen.includes("a1"), true, "its resolved reply stays with the thread");
+  assert.equal(resolvedThreadsHidden, 1, "only the resolved-root thread is hidden");
+});
diff --git a/packages/mcp/test/unit/collaboration.test.mjs b/packages/mcp/test/unit/collaboration.test.mjs
index 84801840..687e5d6e 100644
--- a/packages/mcp/test/unit/collaboration.test.mjs
+++ b/packages/mcp/test/unit/collaboration.test.mjs
@@ -127,36 +127,54 @@ test("markdownToProseMirror: an aligned GFM table maps header alignment", async
 });
 
 // Comment-body data-loss guard (#228 review #4): markdownToProseMirror is reused
-// for COMMENT bodies (createComment/updateComment), so it must NOT canonicalize —
-// a comment may legitimately carry a standalone footnote definition with no
-// matching reference, and canonicalization would drop the whole list (the text
-// would vanish). The page-write variant DOES canonicalize.
-test("markdownToProseMirror (comment path) PRESERVES a reference-less footnote definition", async () => {
+// for COMMENT bodies (createComment/updateComment), so it must NOT canonicalize.
+// Under the #293 canon, footnotes are INLINE (`^[body]`), so a comment can no
+// longer carry a reference-less definition to be dropped — but the comment path
+// must still (a) leave a legacy reference-style `[^id]:` line as harmless literal
+// TEXT (never silently deleted) and (b) preserve an inline footnote it does
+// contain (no canonicalization stripping it). The page-write variant canonicalizes.
+test("markdownToProseMirror (comment path) keeps a legacy `[^id]:` line as literal text", async () => {
+  // A reference-style `[^1]:` line is not canonical footnote syntax anymore, so it
+  // is not parsed into a footnote node — but its TEXT must survive verbatim (no
+  // data loss on the comment write path).
   const md = "A comment.\n\n[^1]: a standalone footnote definition";
   const doc = await markdownToProseMirror(md);
-  const defs = findAll(doc, "footnoteDefinition");
-  assert.equal(defs.length, 1, "the footnote definition must be preserved");
+  assert.equal(
+    findAll(doc, "footnoteDefinition").length,
+    0,
+    "reference-style line is not a footnote node",
+  );
   assert.match(
     JSON.stringify(doc),
     /a standalone footnote definition/,
-    "the definition text must survive the comment write path",
+    "the text must survive the comment write path",
   );
 });
 
-test("markdownToProseMirrorCanonical (page path) DROPS a reference-less footnote definition", async () => {
-  // Same input through the PAGE variant: with no reference, the canonical doc has
-  // no footnotesList (this is the page-side behavior the comment path must avoid).
-  const md = "A page.\n\n[^1]: a standalone footnote definition";
-  const doc = await markdownToProseMirrorCanonical(md);
-  assert.equal(findAll(doc, "footnotesList").length, 0);
-  assert.equal(findAll(doc, "footnoteDefinition").length, 0);
+test("markdownToProseMirror (comment path) PRESERVES an inline footnote (no canonicalization)", async () => {
+  // An inline `^[body]` footnote in a comment imports to a real footnote node and
+  // is NOT dropped: the comment path must never canonicalize away content.
+  const md = "A comment.\n\n^[an inline footnote]";
+  const doc = await markdownToProseMirror(md);
+  assert.equal(findAll(doc, "footnoteDefinition").length, 1);
+  assert.equal(findAll(doc, "footnotesList").length, 1);
+  assert.match(JSON.stringify(doc), /an inline footnote/);
 });
 
-test("markdownToProseMirrorCanonical still canonicalizes a real page footnote (order)", async () => {
-  // Page path must STILL canonicalize: refs b,a -> definitions reorder to b,a.
-  const md = "See[^b] then[^a].\n\n[^a]: alpha\n[^b]: bravo";
+test("markdownToProseMirrorCanonical (page path) yields a single reference-ordered list", async () => {
+  // Page path produces the canonical footnote topology: one trailing
+  // `footnotesList`, definitions in FIRST-REFERENCE order, ids assigned
+  // sequentially. Inline `^[body]` footnotes carry the body at the reference
+  // point, so the bottom list is inherently reference-ordered.
+  const md = "See^[bravo] then^[alpha].";
   const doc = await markdownToProseMirrorCanonical(md);
-  const defs = findAll(doc, "footnoteDefinition").map((d) => d.attrs.id);
-  assert.deepEqual(defs, ["b", "a"]);
+  const defs = findAll(doc, "footnoteDefinition");
+  assert.deepEqual(
+    defs.map((d) => d.attrs.id),
+    ["fn-1", "fn-2"],
+  );
   assert.equal(findAll(doc, "footnotesList").length, 1);
+  // Bodies stay in reference order (bravo referenced before alpha).
+  assert.match(JSON.stringify(defs[0]), /bravo/);
+  assert.match(JSON.stringify(defs[1]), /alpha/);
 });
diff --git a/packages/mcp/test/unit/docmost-md-roundtrip.test.mjs b/packages/mcp/test/unit/docmost-md-roundtrip.test.mjs
index 798bac10..b8b1293c 100644
--- a/packages/mcp/test/unit/docmost-md-roundtrip.test.mjs
+++ b/packages/mcp/test/unit/docmost-md-roundtrip.test.mjs
@@ -210,13 +210,17 @@ test("drawio round-trips through export and import", () => {
     ],
   };
 
+  // #293 canon #8: the media family (image/video/audio/drawio/excalidraw)
+  // serializes to the markdown image form `![alt](src)` plus a trailing
+  // discriminator comment `<!--drawio {json}-->` carrying the non-src attrs.
   const body = convertProseMirrorToMarkdown(doc);
-  assert.match(body, /data-type="drawio"/);
-  assert.match(body, /data-src="https:\/\/example\/diagram\.xml"/);
+  assert.match(body, /!\[\]\(https:\/\/example\/diagram\.xml\)/);
+  assert.match(body, /<!--drawio \{"attachmentId":"att-7"\}-->/);
 
   return markdownToProseMirror(body).then((rebuilt) => {
     const diagram = find(rebuilt, "drawio");
     assert.ok(diagram, "expected a drawio node after import");
     assert.equal(diagram.attrs.src, "https://example/diagram.xml");
+    assert.equal(diagram.attrs.attachmentId, "att-7");
   });
 });
diff --git a/packages/mcp/test/unit/footnote-canonicalize.test.mjs b/packages/mcp/test/unit/footnote-canonicalize.test.mjs
index e626b316..d7af244e 100644
--- a/packages/mcp/test/unit/footnote-canonicalize.test.mjs
+++ b/packages/mcp/test/unit/footnote-canonicalize.test.mjs
@@ -253,22 +253,23 @@ test("insertInlineFootnote: anchor in body BEFORE a nested list still inserts",
   assert.equal(findAll(r.doc, "footnotesList").length, 1);
 });
 
-test("markdown import (page path): out-of-order definitions render as a reference-ordered list", async () => {
-  // References appear b, a, c in the body; definitions are written in a, b, c
-  // order (the import order). The PAGE import path (markdownToProseMirrorCanonical)
-  // canonicalizes so the bottom list follows REFERENCE order — numbers read 1, 2,
-  // 3 down the list. (The non-canonicalizing markdownToProseMirror, used for
-  // comment bodies, would keep the import order; see collaboration.test.mjs.)
-  const md = [
-    "See[^b] then[^a] then[^c].",
-    "",
-    "[^a]: alpha",
-    "[^b]: bravo",
-    "[^c]: charlie",
-  ].join("\n");
+test("markdown import (page path): inline footnotes render as a reference-ordered list", async () => {
+  // Inline `^[body]` footnotes carry their body at the reference point, so the
+  // PAGE import path (markdownToProseMirrorCanonical) materializes the bottom
+  // list in REFERENCE order — numbers read 1, 2, 3 down the list — with ids
+  // assigned sequentially (fn-1, fn-2, fn-3).
+  const md = "See^[bravo] then^[alpha] then^[charlie].";
   const json = await markdownToProseMirrorCanonical(md);
-  assert.deepEqual(defIds(json), ["b", "a", "c"]);
+  assert.deepEqual(defIds(json), ["fn-1", "fn-2", "fn-3"]);
   assert.equal(findAll(json, "footnotesList").length, 1);
+  // Bodies materialize in reference order (bravo, alpha, charlie).
+  const defsJson = JSON.stringify(findAll(json, "footnoteDefinition"));
+  assert.ok(
+    defsJson.indexOf("bravo") <
+      defsJson.indexOf("alpha") &&
+      defsJson.indexOf("alpha") < defsJson.indexOf("charlie"),
+    "definitions follow reference order",
+  );
 });
 
 test("generateFootnoteId: valid uuidv7 shape (version 7, variant 8..b) and unique", () => {
diff --git a/packages/mcp/test/unit/footnotes.test.mjs b/packages/mcp/test/unit/footnotes.test.mjs
index 67ec9bc5..ab7c2c65 100644
--- a/packages/mcp/test/unit/footnotes.test.mjs
+++ b/packages/mcp/test/unit/footnotes.test.mjs
@@ -49,15 +49,19 @@ const footnoteDoc = {
   ],
 };
 
-test("JSON -> Markdown emits pandoc footnote syntax", () => {
+test("JSON -> Markdown emits canonical inline footnote syntax (#293 canon #2)", () => {
+  // Canonical markdown form is Pandoc/Obsidian INLINE footnotes: the note body is
+  // written at the reference point as `^[body]`. There is NO `[^id]` reference
+  // marker and NO trailing `[^id]: …` definition list; the schema id never
+  // reaches markdown.
   const md = convertProseMirrorToMarkdown(footnoteDoc);
-  assert.match(md, /\[\^fn1\]/);
-  assert.match(md, /\[\^fn2\]/);
-  assert.match(md, /\[\^fn1\]: First note\./);
-  assert.match(md, /\[\^fn2\]: Second note\./);
+  assert.match(md, /\^\[First note\.\]/);
+  assert.match(md, /\^\[Second note\.\]/);
+  assert.doesNotMatch(md, /\[\^/); // no reference-style markers
+  assert.doesNotMatch(md, /^\[\^.+\]:/m); // no bottom definition lines
 });
 
-test("Markdown -> JSON rebuilds footnote nodes", async () => {
+test("Markdown -> JSON rebuilds footnote nodes with sequential fn-N ids", async () => {
   const md = convertProseMirrorToMarkdown(footnoteDoc);
   const json = await markdownToProseMirror(md);
 
@@ -65,42 +69,39 @@ test("Markdown -> JSON rebuilds footnote nodes", async () => {
   const list = findAll(json, "footnotesList");
   const defs = findAll(json, "footnoteDefinition");
 
+  // Structure is preserved; ids are (re)assigned sequentially in first-reference
+  // order by the importer (fn-1, fn-2, …) — the concrete id is never carried in
+  // markdown, so it is derived on import.
   assert.equal(refs.length, 2);
   assert.deepEqual(
     refs.map((r) => r.attrs.id),
-    ["fn1", "fn2"],
+    ["fn-1", "fn-2"],
   );
   assert.equal(list.length, 1);
   assert.equal(defs.length, 2);
   assert.deepEqual(
     defs.map((d) => d.attrs.id),
-    ["fn1", "fn2"],
+    ["fn-1", "fn-2"],
   );
 });
 
-test("JSON -> MD -> JSON preserves footnote ids and text", async () => {
+test("JSON -> MD -> JSON is byte-stable and preserves footnote body text", async () => {
   const md = convertProseMirrorToMarkdown(footnoteDoc);
   const json = await markdownToProseMirror(md);
   const md2 = convertProseMirrorToMarkdown(json);
 
-  // The second markdown serialization carries the same markers + definitions.
-  assert.match(md2, /\[\^fn1\]/);
-  assert.match(md2, /\[\^fn2\]/);
-  assert.match(md2, /\[\^fn1\]: First note\./);
-  assert.match(md2, /\[\^fn2\]: Second note\./);
+  // The round trip is byte-stable (ids are not written to markdown, so the
+  // concrete import id cannot perturb the output) and the bodies survive.
+  assert.equal(md2, md);
+  assert.match(md2, /\^\[First note\.\]/);
+  assert.match(md2, /\^\[Second note\.\]/);
 });
 
-test("repeated references REUSE one footnote; duplicate definitions are first-wins (#166)", async () => {
-  // Reuse semantics: many `[^d]` references + several `[^d]:` definitions import
-  // as ONE footnote — the references all keep id "d" (reuse), and only the FIRST
-  // definition is kept (first-wins). Deterministic and stable across re-imports.
-  const md = [
-    "See[^d] one[^d] two[^d].",
-    "",
-    "[^d]: first",
-    "[^d]: second",
-    "[^d]: third",
-  ].join("\n");
+test("identical footnote bodies MERGE to one shared definition (#293 canon #2)", async () => {
+  // Two references whose bodies are byte-identical import as ONE definition
+  // shared by both references (dedup on the exact body text). Two DIFFERENT
+  // bodies stay distinct. Deterministic and stable across re-imports.
+  const md = "See^[same] and^[same], but^[other].";
 
   const idsOf = async () => {
     const json = await markdownToProseMirror(md);
@@ -120,11 +121,11 @@ test("repeated references REUSE one footnote; duplicate definitions are first-wi
 
   // Stable across runs.
   assert.deepEqual(a, b);
-  // Reuse: all three reference markers stay "d".
-  assert.deepEqual(a.refs, ["d", "d", "d"]);
-  // First-wins: a single definition "d" with the FIRST text.
-  assert.deepEqual(a.defIds, ["d"]);
-  assert.equal(a.defText, "first");
+  // Merge: the two "same" references share fn-1; the "other" reference is fn-2.
+  assert.deepEqual(a.refs, ["fn-1", "fn-1", "fn-2"]);
+  // One definition per unique body, in first-reference order.
+  assert.deepEqual(a.defIds, ["fn-1", "fn-2"]);
+  assert.equal(a.defText, "same|other");
 });
 
 test("a [^id]: line inside a fenced code block is NOT treated as a definition", async () => {
diff --git a/packages/mcp/test/unit/markdown-converter.test.mjs b/packages/mcp/test/unit/markdown-converter.test.mjs
index 051a7e88..41ec4b00 100644
--- a/packages/mcp/test/unit/markdown-converter.test.mjs
+++ b/packages/mcp/test/unit/markdown-converter.test.mjs
@@ -70,7 +70,7 @@ test("hardBreak -> trailing two-spaces+newline", () => {
   assert.equal(convertProseMirrorToMarkdown(input), "line1  \nline2");
 });
 
-test("table cell with two block children joined by a space (and a pipe escaped)", () => {
+test("table cell with two block children falls back to a raw HTML table", () => {
   const input = doc({
     type: "table",
     content: [
@@ -86,11 +86,12 @@ test("table cell with two block children joined by a space (and a pipe escaped)"
     ],
   });
 
-  // Single-column header row + separator. The cell joins its two paragraphs
-  // with a space ("a|b c") then escapes the pipe -> "a\|b c".
+  // A pipe-table cell cannot represent two block children, so the canonical
+  // converter emits the whole table as raw HTML (lossless) rather than lossily
+  // flattening the paragraphs into one cell.
   assert.equal(
     convertProseMirrorToMarkdown(input),
-    "| a\\|b c |\n| --- |",
+    "<table><tbody><tr><td><p>a|b</p><p>c</p></td></tr></tbody></table>",
   );
 });
 
@@ -108,20 +109,20 @@ test("code block trailing newline trimmed", () => {
   );
 });
 
-test("textAlign value: delimiting double-quote escaped (attribute-safe, idempotent; < > left literal/inert)", () => {
+test("textAlign is carried in a trailing attached-comment directive (JSON-encoded, safe)", () => {
   const input = doc({
     type: "paragraph",
     attrs: { textAlign: 'right"><b' },
     content: [text("body")],
   });
 
-  // Attribute values escape only & and " so the value cannot break out of the
-  // quoted attribute. < and > are left literal: parse5/jsdom does NOT decode
-  // &lt;/&gt; inside attribute values, so escaping them would corrupt the value
-  // and accumulate on every round-trip. The literal < > are inert inside quotes.
+  // #293 canon #9: paragraph textAlign has no native markdown syntax, so it is
+  // attached as a trailing `<!--attrs {json}-->` comment on the block. The value
+  // is JSON-encoded, so a hostile value (`"`, `<`, `>`) is carried verbatim and
+  // inert — it cannot break out of the comment.
   assert.equal(
     convertProseMirrorToMarkdown(input),
-    '<div align="right&quot;><b">body</div>',
+    'body <!--attrs {"textAlign":"right\\"><b"}-->',
   );
 });
 
@@ -150,10 +151,10 @@ test("empty task item still emits its marker", () => {
   assert.equal(convertProseMirrorToMarkdown(input), "- [ ]\n- [x]");
 });
 
-// Image captions (issue #221). An image WITHOUT a caption stays the lossy-free
-// `![alt](src)`; WITH a caption it is emitted as a raw <img data-caption>
-// wrapped in a block <div> (symmetric to video) so the round-trip md -> html ->
-// json restores the caption via the image extension's parseHTML.
+// Image captions (issue #221 / #293 canon #8). An image WITHOUT a caption stays
+// the plain `![alt](src)`; WITH a caption (or any other non-src attr) the extra
+// attrs ride in a trailing `<!--img {json}-->` discriminator comment on the
+// markdown image form, so the round-trip md -> json restores them.
 test("image without a caption emits plain ![alt](src)", () => {
   const input = doc({
     type: "image",
@@ -162,24 +163,24 @@ test("image without a caption emits plain ![alt](src)", () => {
   assert.equal(convertProseMirrorToMarkdown(input), "![cat](/files/a.png)");
 });
 
-test("image with a caption emits a raw <img data-caption> in a block div", () => {
+test("image with a caption emits ![alt](src) plus an <!--img--> directive", () => {
   const input = doc({
     type: "image",
     attrs: { src: "/files/a.png", alt: "cat", caption: "A grey cat" },
   });
   assert.equal(
     convertProseMirrorToMarkdown(input),
-    '<div><img src="/files/a.png" alt="cat" data-caption="A grey cat"></div>',
+    '![cat](/files/a.png) <!--img {"caption":"A grey cat"}-->',
   );
 });
 
-test("image caption escapes & and \" in the data-caption attribute", () => {
+test("image caption is JSON-encoded in the <!--img--> directive (& and \" safe)", () => {
   const input = doc({
     type: "image",
     attrs: { src: "/files/a.png", caption: 'Tom & "Jerry"' },
   });
   assert.equal(
     convertProseMirrorToMarkdown(input),
-    '<div><img src="/files/a.png" data-caption="Tom &amp; &quot;Jerry&quot;"></div>',
+    '![](/files/a.png) <!--img {"caption":"Tom & \\"Jerry\\""}-->',
   );
 });
diff --git a/packages/mcp/test/unit/media-roundtrip-attrs.test.mjs b/packages/mcp/test/unit/media-roundtrip-attrs.test.mjs
index 37668fe0..f2b7ef82 100644
--- a/packages/mcp/test/unit/media-roundtrip-attrs.test.mjs
+++ b/packages/mcp/test/unit/media-roundtrip-attrs.test.mjs
@@ -55,8 +55,10 @@ test("round-trip: drawio diagram survives with src, title, dimensions, align, at
     },
     "drawio",
   );
-  // The converter must emit the schema-matching div[data-type="drawio"].
-  assert.match(md, /data-type="drawio"/);
+  // #293 canon #8: the media family serializes to the markdown image form plus a
+  // trailing discriminator comment carrying the non-src attrs.
+  assert.match(md, /^!\[\]\(\/api\/files\/d\.drawio\)/);
+  assert.match(md, /<!--drawio \{.*"attachmentId":"dz1".*\}-->/);
   assert.equal(found.length, 1, "drawio node must survive the round-trip");
   const a = found[0].attrs;
   assert.equal(a.src, "/api/files/d.drawio");
@@ -123,13 +125,19 @@ test("round-trip: pdf preserves width/height (standard attrs) plus name", async
 });
 
 // ---------------------------------------------------------------------------
-// Escaping: a src containing a double quote must survive the attribute-quoted
-// HTML emission (escapeAttr) and re-parse to the exact original value, with no
-// node loss and no HTML injection.
+// Escaping: a src containing a double quote must survive the markdown image form
+// with no node loss and no injection. In the `![](src)` link the URL is
+// normalized (a raw `"` percent-encodes to `%22`) on import — a semantically
+// equivalent, IDEMPOTENT normalization (it does not drift on further round
+// trips), not data loss.
 // ---------------------------------------------------------------------------
-test("round-trip: a src containing a double quote is escaped and recovered intact", async () => {
+test("round-trip: a src containing a double quote is normalized (idempotent) and survives", async () => {
   const tricky = 'https://e.com/x?a="b"&c=1';
+  const normalized = "https://e.com/x?a=%22b%22&c=1";
   const { found } = await roundtrip({ type: "youtube", attrs: { src: tricky } }, "youtube");
   assert.equal(found.length, 1, "node must survive a quote-bearing src");
-  assert.equal(found[0].attrs.src, tricky, "the exact src is recovered");
+  assert.equal(found[0].attrs.src, normalized, "the quote is percent-encoded in the URL");
+  // Idempotent: a second round trip from the normalized node is byte-stable.
+  const again = await roundtrip({ type: "youtube", attrs: { src: normalized } }, "youtube");
+  assert.equal(again.found[0].attrs.src, normalized);
 });
diff --git a/packages/mcp/test/unit/media-roundtrip.test.mjs b/packages/mcp/test/unit/media-roundtrip.test.mjs
index 9ef99602..9a99a75a 100644
--- a/packages/mcp/test/unit/media-roundtrip.test.mjs
+++ b/packages/mcp/test/unit/media-roundtrip.test.mjs
@@ -25,19 +25,15 @@ const findAll = (node, type, acc = []) => {
 };
 
 // ---------------------------------------------------------------------------
-// DATA-LOSS: atom block nodes with no converter case serialize to "" and the
-// whole block disappears from markdown export.
-//
-// markdown-converter.ts has a `default` branch (~line 601) that renders a node
-// as `nodeContent.map(processNode).join("")`. For a leaf/atom node (no
-// content) that yields "" — so the node (and ALL its attributes) is dropped.
-// `htmlEmbed` and `pageBreak` are both block atoms in docmost-schema.ts with no
-// case in the converter, so they vanish on markdown export.
-//
-// These tests assert the CURRENT (buggy) behavior and name it, so that when a
-// converter case is added the failing assertion flags the test for an update.
+// #293 canon: atom block nodes with no NATIVE markdown syntax are preserved via
+// dedicated converter forms (they used to serialize to "" and vanish — the old
+// mcp converter's data-loss gap, now fixed by consuming the shared package):
+//   - htmlEmbed  -> a raw `<div data-type="htmlEmbed" data-source=… data-height=…>`
+//                   block (source base64-encoded so arbitrary HTML is inert);
+//   - pageBreak  -> a standalone `<!--pagebreak-->` machinery comment (#5).
+// Both survive markdown export AND a full PM -> markdown -> PM round-trip.
 // ---------------------------------------------------------------------------
-test("DATA-LOSS: an htmlEmbed block is silently dropped from markdown export (no converter case)", () => {
+test("htmlEmbed block survives markdown export (source + height preserved)", () => {
   const input = doc(
     para(text("before")),
     { type: "htmlEmbed", attrs: { source: "<b>hi</b>", height: 200 } },
@@ -45,32 +41,31 @@ test("DATA-LOSS: an htmlEmbed block is silently dropped from markdown export (no
   );
   const md = convertProseMirrorToMarkdown(input);
 
-  // BUG: the htmlEmbed block, including its `source` and `height` attrs, is
-  // gone — only the surrounding paragraphs survive. If a future fix adds an
-  // htmlEmbed case, update this test to assert the block (or a placeholder)
-  // survives instead.
-  assert.equal(md, "before\n\n\n\nafter", "htmlEmbed currently disappears");
-  assert.ok(!md.includes("<b>hi</b>"), "the embed source is NOT preserved (data-loss)");
+  assert.match(md, /data-type="htmlEmbed"/);
+  assert.match(md, /data-height="200"/);
+  // The raw source is base64-encoded in data-source (not emitted verbatim), so
+  // the surrounding markdown cannot be corrupted by hostile embed HTML.
+  assert.match(md, /data-source="[^"]+"/);
+  assert.ok(md.includes("before") && md.includes("after"));
 });
 
-test("DATA-LOSS: an htmlEmbed does NOT round-trip (PM -> markdown -> PM loses the node)", async () => {
+test("htmlEmbed round-trips PM -> markdown -> PM (node + source recovered)", async () => {
   const input = doc(
     para(text("x")),
     { type: "htmlEmbed", attrs: { source: "<i>raw</i>", height: 120 } },
   );
   const out = await markdownToProseMirror(convertProseMirrorToMarkdown(input));
-  assert.equal(
-    findAll(out, "htmlEmbed").length,
-    0,
-    "htmlEmbed is lost across a markdown round-trip (known data-loss gap)",
-  );
+  const embeds = findAll(out, "htmlEmbed");
+  assert.equal(embeds.length, 1, "htmlEmbed survives the markdown round-trip");
+  assert.equal(embeds[0].attrs.source, "<i>raw</i>", "source recovered intact");
 });
 
-test("DATA-LOSS: a pageBreak block is silently dropped from markdown export (no converter case)", () => {
+test("pageBreak block survives markdown export and round-trips", async () => {
   const input = doc(para(text("a")), { type: "pageBreak" }, para(text("b")));
   const md = convertProseMirrorToMarkdown(input);
-  // BUG: pageBreak (a block atom with no converter case) disappears.
-  assert.equal(md, "a\n\n\n\nb", "pageBreak currently disappears");
+  assert.match(md, /<!--pagebreak-->/);
+  const out = await markdownToProseMirror(md);
+  assert.equal(findAll(out, "pageBreak").length, 1);
 });
 
 // ---------------------------------------------------------------------------
diff --git a/packages/mcp/test/unit/roundtrip.test.mjs b/packages/mcp/test/unit/roundtrip.test.mjs
index 1b80e554..08ae6219 100644
--- a/packages/mcp/test/unit/roundtrip.test.mjs
+++ b/packages/mcp/test/unit/roundtrip.test.mjs
@@ -165,3 +165,67 @@ test("import: a colored mention span keeps the mention node", async () => {
   const out = await markdownToProseMirror('<span data-type="mention" data-id="u1" data-label="Alice" style="color: blue">@Alice</span>');
   assert.equal(findNodes(out, "mention").length, 1, "mention node must survive a colored span");
 });
+
+// ---------------------------------------------------------------------------
+// #293 STEP 5 canon safety net. These assert STRUCTURE/content preservation
+// (format-agnostic: the node/mark and its value survive PM -> markdown -> PM,
+// and the markdown is idempotent), NOT the exact markdown bytes — so they stay
+// valid regardless of the concrete canonical spelling. They cover the node/mark
+// types whose canonical markdown form changed in #293 (highlight-without-color,
+// textAlign, subpages, inline footnotes) and complement the existing math /
+// media / mention / column round-trips above.
+// ---------------------------------------------------------------------------
+test("round-trip: highlight WITHOUT a color survives as a highlight mark (==)", async () => {
+  const input = doc(para(text("hi", [{ type: "highlight", attrs: { color: null } }])));
+  const md = convertProseMirrorToMarkdown(input);
+  const out = await roundtrip(input);
+  const hit = findNodes(out, "text").find(
+    (n) => n.text === "hi" && (n.marks || []).some((m) => m.type === "highlight"),
+  );
+  assert.ok(hit, "the highlight mark must survive a color-less round-trip");
+  // Idempotent markdown.
+  assert.equal(convertProseMirrorToMarkdown(out), md);
+});
+
+test("round-trip: paragraph textAlign survives via the attached-comment directive", async () => {
+  const input = doc({
+    type: "paragraph",
+    attrs: { textAlign: "center" },
+    content: [text("mid")],
+  });
+  const md = convertProseMirrorToMarkdown(input);
+  const out = await roundtrip(input);
+  const p = findNodes(out, "paragraph").find((n) => n.attrs && n.attrs.textAlign === "center");
+  assert.ok(p, "textAlign must be restored on the paragraph");
+  assert.equal(convertProseMirrorToMarkdown(out), md, "textAlign round-trip is idempotent");
+});
+
+test("round-trip: subpages atom survives", async () => {
+  const input = doc({ type: "subpages" });
+  const out = await roundtrip(input);
+  assert.equal(findNodes(out, "subpages").length, 1, "subpages node must survive");
+});
+
+test("round-trip: inline footnote survives with body text (canonical structure)", async () => {
+  const input = doc(
+    para(text("Claim"), { type: "footnoteReference", attrs: { id: "fnA" } }),
+    {
+      type: "footnotesList",
+      content: [
+        {
+          type: "footnoteDefinition",
+          attrs: { id: "fnA" },
+          content: [para(text("the evidence"))],
+        },
+      ],
+    },
+  );
+  const md = convertProseMirrorToMarkdown(input);
+  const out = await roundtrip(input);
+  assert.equal(findNodes(out, "footnoteReference").length, 1);
+  assert.equal(findNodes(out, "footnotesList").length, 1);
+  assert.equal(findNodes(out, "footnoteDefinition").length, 1);
+  assert.match(JSON.stringify(out), /the evidence/, "footnote body survives");
+  // Byte-stable (the schema id is never written to markdown).
+  assert.equal(convertProseMirrorToMarkdown(out), md);
+});
diff --git a/packages/prosemirror-markdown/package.json b/packages/prosemirror-markdown/package.json
new file mode 100644
index 00000000..9f0bd2e3
--- /dev/null
+++ b/packages/prosemirror-markdown/package.json
@@ -0,0 +1,45 @@
+{
+  "name": "@docmost/prosemirror-markdown",
+  "version": "0.1.0",
+  "description": "Pure ProseMirror <-> Markdown converter + schema mirror (headless, framework-free).",
+  "private": true,
+  "type": "module",
+  "main": "./build/index.js",
+  "types": "./build/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./build/index.d.ts",
+      "default": "./build/index.js"
+    }
+  },
+  "scripts": {
+    "build": "tsc",
+    "watch": "tsc --watch",
+    "test": "vitest run",
+    "test:watch": "vitest"
+  },
+  "license": "MIT",
+  "dependencies": {
+    "@tiptap/core": "3.20.4",
+    "@tiptap/extension-highlight": "3.20.4",
+    "@tiptap/extension-image": "3.20.4",
+    "@tiptap/extension-subscript": "3.20.4",
+    "@tiptap/extension-superscript": "3.20.4",
+    "@tiptap/extension-task-item": "3.20.4",
+    "@tiptap/extension-task-list": "3.20.4",
+    "@tiptap/html": "3.20.4",
+    "@tiptap/pm": "3.20.4",
+    "@tiptap/starter-kit": "3.20.4",
+    "jsdom": "25.0.0",
+    "marked": "17.0.5",
+    "zod": "4.3.6"
+  },
+  "devDependencies": {
+    "@docmost/editor-ext": "workspace:*",
+    "@types/jsdom": "^21.1.7",
+    "@types/node": "^20.0.0",
+    "fast-check": "^4.8.0",
+    "typescript": "^5.0.0",
+    "vitest": "4.1.6"
+  }
+}
diff --git a/packages/prosemirror-markdown/src/index.ts b/packages/prosemirror-markdown/src/index.ts
new file mode 100644
index 00000000..fe94a762
--- /dev/null
+++ b/packages/prosemirror-markdown/src/index.ts
@@ -0,0 +1,9 @@
+/**
+ * Public surface of `@docmost/prosemirror-markdown`.
+ *
+ * A headless, framework-free ProseMirror <-> Markdown converter plus the
+ * Docmost schema mirror. Everything lives under `lib/` (the converter core);
+ * this top-level barrel simply re-exports that surface so the package entry is
+ * the converter surface.
+ */
+export * from "./lib/index.js";
diff --git a/packages/prosemirror-markdown/src/lib/attached-comment.ts b/packages/prosemirror-markdown/src/lib/attached-comment.ts
new file mode 100644
index 00000000..29c6eb91
--- /dev/null
+++ b/packages/prosemirror-markdown/src/lib/attached-comment.ts
@@ -0,0 +1,124 @@
+/**
+ * Attached-comment convention (#293 canon).
+ *
+ * Some block-level attributes have no native markdown syntax (paragraph/heading
+ * `textAlign` — #9; image/media attrs — #4/#8). Rather than HTML-wrapping the
+ * whole block (the old `<div align>` / `<p style>` forms, which the maintainer
+ * had to patch repeatedly and which did not round-trip cleanly), we ATTACH a
+ * compact HTML comment at the END of the block's rendered line:
+ *
+ *     Some paragraph text <!--attrs {"textAlign":"center"}-->
+ *
+ * The comment is invisible in any markdown renderer and is dropped by the
+ * DOM/generateJSON import stage, so it can never leak into the document body.
+ * The importer intercepts it BEFORE that stage (see markdown-to-prosemirror's
+ * applyAttachedComments) and re-applies the encoded attributes to the node.
+ *
+ * This module holds the PURE, reusable primitives of the convention so the
+ * serializer, the parser, and future decisions (#4 image, #8 media) share ONE
+ * implementation:
+ *   - `attachedCommentFor` / `standaloneCommentFor` — build the comment string.
+ *   - `parseAttachedComment(data)`     — parse a comment node's data back.
+ */
+
+/**
+ * A parsed attached comment: the leading `name` token and the decoded JSON
+ * object payload (empty object when the comment carried no JSON body).
+ */
+export interface AttachedComment {
+  name: string;
+  attrs: Record<string, unknown>;
+}
+
+/**
+ * Grammar of an attached comment's DATA (the text between `<!--` and `-->`):
+ * a leading name token (`attrs`, `img`, …) optionally followed by whitespace
+ * and a single JSON object. The name deliberately does NOT allow `:` so the
+ * file-level envelope comments (`docmost:meta` / `docmost:comments`) never match
+ * and stay inert here.
+ */
+const ATTACHED_COMMENT_RE = /^\s*([A-Za-z][\w-]*)(?:\s+(\{[\s\S]*\}))?\s*$/;
+
+/**
+ * Build an attached HTML comment `<!--name {compact-json}-->` for `json`.
+ *
+ * The JSON is emitted compactly (no spaces) via `JSON.stringify`. A string value
+ * may legitimately contain two consecutive hyphens `--`, which would prematurely
+ * close the HTML comment (`-->`). We defuse that WITHOUT changing the decoded
+ * value: each hyphen of every `--` pair is rewritten as the JSON unicode escape
+ * `\u002d`, so `JSON.parse` on the reading side restores the exact original
+ * hyphens. `--` can only occur inside a JSON string (structural JSON never
+ * produces it), so a blanket replace over the stringified payload is safe.
+ */
+export function attachedCommentFor(name: string, json: object): string {
+  return `<!--${name} ${escapeCommentJson(json)}-->`;
+}
+
+/**
+ * Compactly stringify `json` and defuse any `--` pair so the payload can never
+ * close the HTML comment early. Shared by `attachedCommentFor` (attached form)
+ * and `standaloneCommentFor` (standalone form) so both stay in sync.
+ *
+ * A string value may legitimately contain two consecutive hyphens `--`, which
+ * would prematurely close the comment (`-->`). We defuse that WITHOUT changing
+ * the decoded value: each hyphen of every `--` pair is rewritten as the JSON
+ * unicode escape `\u002d`, so `JSON.parse` on the reading side restores the exact
+ * original hyphens. `--` can only occur inside a JSON string (structural JSON
+ * never produces it), so a blanket replace over the stringified payload is safe.
+ * Scanning left-to-right and replacing each `--` handles odd runs too (`---` ->
+ * two escapes + one bare `-`, still `---` after JSON.parse).
+ */
+function escapeCommentJson(json: object): string {
+  return JSON.stringify(json).replace(/--/g, "\\u002d\\u002d");
+}
+
+/**
+ * Build a STANDALONE machinery comment (#293 canon #5) for a block node that
+ * lives on its OWN line, e.g. `<!--pagebreak-->` or `<!--subpages-->`.
+ *
+ * Grammar is identical to the attached form (`<!--name {JSON?}-->`), but the
+ * JSON body is emitted ONLY when there are real attributes to carry:
+ *   - `standaloneCommentFor("pagebreak")`            -> `<!--pagebreak-->`
+ *   - `standaloneCommentFor("subpages")`             -> `<!--subpages-->`
+ *   - `standaloneCommentFor("subpages", {recursive:true})`
+ *                                    -> `<!--subpages {"recursive":true}-->`
+ *
+ * When `attrs` is undefined/null/empty-object the comment is name-only (no JSON,
+ * which parses back to default attrs). Otherwise the JSON body is emitted with
+ * the SAME `--`-escaping as `attachedCommentFor` (via `escapeCommentJson`), so
+ * the standalone and attached encoders can never diverge.
+ */
+export function standaloneCommentFor(name: string, attrs?: object | null): string {
+  if (!attrs || Object.keys(attrs).length === 0) {
+    return `<!--${name}-->`;
+  }
+  return `<!--${name} ${escapeCommentJson(attrs)}-->`;
+}
+
+/**
+ * Parse the DATA of a comment node into `{ name, attrs }`, or `null` when it is
+ * not a well-formed attached comment.
+ *
+ * Fail-open by design (maintainer spec): a comment whose name token is missing,
+ * whose JSON body is malformed, or whose body is not a plain object returns
+ * `null` so the caller ignores it and keeps default attributes. Unknown keys in
+ * a valid object are preserved here and filtered by the caller.
+ */
+export function parseAttachedComment(data: string): AttachedComment | null {
+  const m = ATTACHED_COMMENT_RE.exec(data);
+  if (!m) return null;
+  const name = m[1];
+  if (m[2] === undefined) {
+    // Name-only comment (no JSON body): a valid attached marker with no attrs.
+    return { name, attrs: {} };
+  }
+  try {
+    const parsed = JSON.parse(m[2]);
+    if (parsed && typeof parsed === "object" && !Array.isArray(parsed)) {
+      return { name, attrs: parsed as Record<string, unknown> };
+    }
+    return null; // fail-open: payload is not a plain object
+  } catch {
+    return null; // fail-open: malformed JSON -> ignore the comment
+  }
+}
diff --git a/packages/git-sync/src/lib/canonicalize.ts b/packages/prosemirror-markdown/src/lib/canonicalize.ts
similarity index 96%
rename from packages/git-sync/src/lib/canonicalize.ts
rename to packages/prosemirror-markdown/src/lib/canonicalize.ts
index 99ff5bc6..25fbc921 100644
--- a/packages/git-sync/src/lib/canonicalize.ts
+++ b/packages/prosemirror-markdown/src/lib/canonicalize.ts
@@ -45,9 +45,11 @@
  *       converter coercing numeric `width`/`height` to strings, which is outside
  *       canonicalize's scope.
  *
- * NOTE: `image` has NO non-null align default — its `align` defaults to `null`
- * (docmost-schema.ts L174), so it is already handled by the null-drop rule and
- * is intentionally NOT listed here.
+ * NOTE: `image` align now defaults to `"center"` — unified with editor-ext
+ * (#293 canon #4). It is listed below so a canonical image drops `align` when
+ * it equals "center" (absent ≡ default), exactly like the diagram/media nodes.
+ * A null align is likewise dropped by the null-drop rule and re-imports as the
+ * "center" default, so bare `![](src)` images stay canonically clean.
  */
 const KNOWN_DEFAULTS: Record<string, Record<string, unknown>> = {
   // mark types
@@ -62,6 +64,9 @@ const KNOWN_DEFAULTS: Record<string, Record<string, unknown>> = {
   orderedList: {
     start: 1,
   },
+  image: {
+    align: "center",
+  },
   drawio: {
     align: "center",
   },
diff --git a/packages/git-sync/src/lib/docmost-schema.ts b/packages/prosemirror-markdown/src/lib/docmost-schema.ts
similarity index 97%
rename from packages/git-sync/src/lib/docmost-schema.ts
rename to packages/prosemirror-markdown/src/lib/docmost-schema.ts
index 276efe90..1a63ec95 100644
--- a/packages/git-sync/src/lib/docmost-schema.ts
+++ b/packages/prosemirror-markdown/src/lib/docmost-schema.ts
@@ -256,7 +256,22 @@ const DocmostAttributes = Extension.create({
       {
         types: ["image"],
         attributes: {
-          align: { default: null },
+          // #293 canon #4: the image `align` default is unified to "center"
+          // (matching editor-ext, the source of real user documents) so an
+          // editor-authored image — which is always align="center" — serializes
+          // as the clean `![](src)` form with NO attached comment, and only a
+          // genuinely non-default alignment (left/right) emits an `<!--img-->`
+          // comment. The DOM attribute name stays `align` (imageToHtml already
+          // round-trips it as align="…"); only the DEFAULT value changed from
+          // null to "center". parseHTML reads the `align` attribute so a bare
+          // <img> with no align falls back to "center", and <img align="left">
+          // reads "left".
+          align: {
+            default: "center",
+            parseHTML: (el: HTMLElement) => el.getAttribute("align") || "center",
+            renderHTML: (attrs: Record<string, any>) =>
+              attrs.align && attrs.align !== "center" ? { align: attrs.align } : {},
+          },
           // imageToHtml emits these Docmost-specific image attrs as data-*; map
           // them back explicitly so a top-level image (or one inside a column)
           // round-trips them. Without a parseHTML the default reads the bare
diff --git a/packages/prosemirror-markdown/src/lib/footnote.ts b/packages/prosemirror-markdown/src/lib/footnote.ts
new file mode 100644
index 00000000..d1732734
--- /dev/null
+++ b/packages/prosemirror-markdown/src/lib/footnote.ts
@@ -0,0 +1,61 @@
+/**
+ * #293 canon #2: inline footnotes `^[text]`.
+ *
+ * Shared, side-effect-free helpers used by BOTH the serializer
+ * (markdown-converter.ts) and the importer (markdown-to-prosemirror.ts) so the
+ * two directions cannot drift.
+ *
+ * The canonical markdown form is Pandoc/Obsidian inline footnotes: the note body
+ * is written AT the reference point as `^[body]`; there is no separate
+ * `[^id]: …` definition line and no bottom `<section>` list in the markdown. On
+ * import the body is re-assembled into the schema's doc-level
+ * `footnotesList`/`footnoteDefinition` so the editor sees the usual three-node
+ * footnote model, while identical bodies MERGE to a single definition shared by
+ * every reference. Ids are assigned by the importer's assembleFootnotes pass
+ * (dedup on the EXACT body text -> sequential `fn-N`), NOT derived from a hash,
+ * so two DIFFERENT bodies can never collide onto one definition (F1). The id is
+ * never written to markdown (`^[body]` carries only text), so the round trip
+ * stays byte-stable regardless of the concrete id.
+ */
+
+/**
+ * Split an ENCODED footnote body (the inner captured between `^[` and its
+ * matching `]`, or the value of a `data-fn-text` attribute) into its paragraph
+ * markdown strings.
+ *
+ * Paragraph boundaries are the two-character literal separator `\n` (backslash +
+ * n); a REAL backslash-n in the body was encoded as `\\n` (an escaped backslash
+ * followed by n) by the serializer, so it must NOT split. The scan therefore
+ * treats any `\<char>` as an escaped pair kept verbatim (so `\\` `n` stays a
+ * literal backslash-then-n and the trailing `n` is plain), and only an
+ * UNescaped `\n` is a separator. Every other backslash escape (`\=`, `\$`,
+ * `\[`, …) is preserved untouched so the per-paragraph `parseInline` decodes it.
+ */
+export function splitFootnoteParagraphs(encoded: string): string[] {
+  const result: string[] = [];
+  let segment = "";
+  let pos = 0;
+  while (pos < encoded.length) {
+    const ch = encoded.charAt(pos);
+    const startsPair = ch === "\\" && pos + 1 < encoded.length;
+    if (!startsPair) {
+      // Ordinary character, or a lone trailing backslash: copy it as-is.
+      segment += ch;
+      pos += 1;
+      continue;
+    }
+    const follower = encoded.charAt(pos + 1);
+    if (follower === "n") {
+      // Unescaped backslash-n closes the current paragraph.
+      result.push(segment);
+      segment = "";
+    } else {
+      // Any other pair (notably `\\`) is copied verbatim; swallowing both
+      // characters keeps the `n` of an encoded `\\n` from acting as a separator.
+      segment += ch + follower;
+    }
+    pos += 2;
+  }
+  result.push(segment);
+  return result;
+}
diff --git a/packages/git-sync/src/lib/index.ts b/packages/prosemirror-markdown/src/lib/index.ts
similarity index 50%
rename from packages/git-sync/src/lib/index.ts
rename to packages/prosemirror-markdown/src/lib/index.ts
index 9e797a26..f95e6a6d 100644
--- a/packages/git-sync/src/lib/index.ts
+++ b/packages/prosemirror-markdown/src/lib/index.ts
@@ -16,9 +16,29 @@ export {
 export type { DocmostMdMeta } from "./markdown-document.js";
 
 export { convertProseMirrorToMarkdown } from "./markdown-converter.js";
+export type { ConvertProseMirrorToMarkdownOptions } from "./markdown-converter.js";
 
 export { markdownToProseMirror } from "./markdown-to-prosemirror.js";
 
+// The Docmost tiptap schema mirror. Exposed so consumers (and the sync
+// engine's schema-validity regression tests) can build the exact ProseMirror
+// schema the converter targets.
+export { docmostExtensions } from "./docmost-schema.js";
+
+// Schema-adjacent sanitizers used by consumers (mcp) so the single canonical,
+// alias-aware / allowlist implementations live ONLY here (no drifting copies).
+export { clampCalloutType, sanitizeCssColor } from "./docmost-schema.js";
+
+// Attached-comment convention (#293 canon #9/#4/#8): the reusable primitives
+// the serializer/parser use to encode attrs that have no native markdown syntax
+// as trailing `<!--name {json}-->` comments.
+export {
+  attachedCommentFor,
+  standaloneCommentFor,
+  parseAttachedComment,
+} from "./attached-comment.js";
+export type { AttachedComment } from "./attached-comment.js";
+
 export {
   canonicalizeContent,
   docsCanonicallyEqual,
diff --git a/packages/prosemirror-markdown/src/lib/markdown-converter.ts b/packages/prosemirror-markdown/src/lib/markdown-converter.ts
new file mode 100644
index 00000000..2d173e52
--- /dev/null
+++ b/packages/prosemirror-markdown/src/lib/markdown-converter.ts
@@ -0,0 +1,1528 @@
+import { encodeHtmlEmbedSource } from "./docmost-schema.js";
+import {
+  attachedCommentFor,
+  standaloneCommentFor,
+} from "./attached-comment.js";
+import {
+  encodeInlineMathLatex,
+  inlineMathGlobalRe,
+  inlineMathSerializable,
+} from "./math-inline.js";
+import {
+  attachmentToHtml,
+  audioToHtml,
+  diagramToHtml,
+  embedToHtml,
+  pageEmbedToHtml,
+  pdfToHtml,
+  transclusionReferenceToHtml,
+  videoToHtml,
+  youtubeToHtml,
+} from "./media-html.js";
+
+/**
+ * Hard cap on processNode recursion depth (see the depth guard below).
+ *
+ * Chosen well above any realistic document (the deepest legitimate nesting the
+ * editor can produce is far shallower) yet far below the point where the
+ * converter's own call stack overflows. The heaviest shape (deeply nested
+ * lists) costs ~5 JS frames per level and the runtime stack holds ~10k frames,
+ * so the measured overflow is around level ~650 (deeply nested lists); 400
+ * leaves a comfortable margin while still rendering pathological-but-bounded
+ * docs in full (the 200-level stress fixture reaches depth ~204).
+ */
+const MAX_NODE_DEPTH = 400;
+
+/**
+ * Options for {@link convertProseMirrorToMarkdown}.
+ */
+export interface ConvertProseMirrorToMarkdownOptions {
+  /**
+   * When true, an inline comment anchor whose Comment mark is `resolved`
+   * emits its BARE text (no `<span data-comment-id …>` wrapper), so an agent
+   * reading the page never sees resolved-comment anchors. ACTIVE (unresolved)
+   * anchors still emit their wrapper. Defaults to false — a zero-behavior
+   * change for every existing caller, including the lossless git-sync export
+   * path where resolved anchors MUST be preserved for round-tripping.
+   */
+  dropResolvedCommentAnchors?: boolean;
+}
+
+/**
+ * Convert ProseMirror/TipTap JSON content to Markdown
+ * Supports all Docmost-specific node types and extensions
+ */
+export function convertProseMirrorToMarkdown(
+  content: any,
+  options: ConvertProseMirrorToMarkdownOptions = {},
+): string {
+  if (!content || !content.content) return "";
+
+  // Closure flag read by both `case "comment"` emitters (the top-level marks
+  // loop and the raw-HTML inlineToHtml path). Off by default; the agent-read
+  // callers (mcp getPage / in-app AI chat) pass it true.
+  const dropResolvedCommentAnchors = options.dropResolvedCommentAnchors === true;
+
+  // Escape a value interpolated into an HTML double-quoted attribute value
+  // (textAlign, colors, image src, math `text`, all data-* attrs, etc.). In the
+  // ATTRIBUTE context only the quote that delimits the value and the ampersand
+  // that starts an entity are special, so we escape ONLY & and " (not ' — see
+  // the NOTE at the end of this comment). We deliberately do NOT escape < or
+  // >: the HTML re-parser (parse5/jsdom via @tiptap/html) does NOT decode
+  // &lt;/&gt; back inside attribute values, so escaping them would corrupt the
+  // stored data (e.g. a math node's LaTeX `a < b`) and ACCUMULATE escapes on
+  // every round-trip (`a < b` -> `a &lt; b` -> `a &amp;lt; b`). Escaping & "
+  // keeps the value inert against attribute-injection while staying idempotent.
+  // NOTE: escape ONLY & and " here. The value is always wrapped in double
+  // quotes, so " is the only delimiter; ' is NOT special in a double-quoted
+  // value, and parse5 does not decode &#39; back inside attribute values, so
+  // escaping ' would (like < >) corrupt the value and accumulate &amp; on every
+  // round-trip. Escaping & and " is idempotent (parse5 decodes them back).
+  const escapeAttr = (value: unknown): string => {
+    const raw = String(value);
+    return raw.replace(/&/g, "&amp;").replace(/"/g, "&quot;");
+  };
+
+  // Escape a value placed as HTML element TEXT content (between tags), where
+  // <, >, and & are all significant. Used for text rendered inside raw-HTML
+  // blocks (table cells / columns) so stored characters cannot inject markup.
+  const escapeHtmlText = (value: unknown): string => {
+    // Ampersand goes first so the entities added for < and > are not re-escaped.
+    const ampSafe = String(value).replace(/&/g, "&amp;");
+    return ampSafe.replace(/</g, "&lt;").replace(/>/g, "&gt;");
+  };
+
+  // Percent-encode characters that would break out of a markdown URL target
+  // (...) — whitespace/newlines and parentheses — so a stored src stays a
+  // single inert token (used for image/video/youtube srcs).
+  const encodeMdUrl = (value: unknown): string => {
+    // A space keeps the short %20 form; other whitespace is percent-encoded.
+    const encodeWs = (ws: string) => (ws === " " ? "%20" : encodeURIComponent(ws));
+    return String(value || "").replace(/\s/g, encodeWs).replace(/\(/g, "%28").replace(/\)/g, "%29");
+  };
+
+  // Backslash-escape every character that would be INTERPRETED inside a markdown
+  // label re-parsed as inline content — used for a link-form media node's visible
+  // text (`attrs.name`/`attrs.provider`, #293 canon #8) AND for an image `![alt]`
+  // (canon #4) — so the value round-trips byte-exact. Two overlapping trigger
+  // sets must be escaped:
+  //   1. Stock CommonMark inline: emphasis (`* _`), code (`` ` ``), strikethrough
+  //      (`~`), autolinks/raw-HTML (`<`), HTML entities (`&`), image markers (`!`),
+  //      brackets (`[ ]`), and `( )` — even with `[ ]` escaped, an unescaped
+  //      `](x)` forms a false nested-link destination and fragments the parse.
+  //   2. The Docmost inline EXTENSIONS this package registers on its marked
+  //      instance: highlight `==x==` (canon #7), math `$x$` (canon #6), and
+  //      footnote `^[x]` (canon #2). Their triggers `= $ ^` are NOT CommonMark
+  //      punctuation the stock lexer would treat specially, but the extension
+  //      tokenizers fire on them — so an alt/name like `x $A$ y`, `use ==b==`, or
+  //      `^[fn]` would be silently turned into a math/highlight/footnote node on
+  //      import unless the trigger is escaped. `\= \$ \^` decode back to literals
+  //      (all ASCII punctuation) and, being escape tokens, stop the extension
+  //      tokenizer from matching — verified lossless round-trip.
+  const escapeLinkText = (value: unknown): string =>
+    String(value ?? "").replace(/[\\`*_~[\]<&!()=$^]/g, "\\$&");
+
+  // #293 canon #6: the schema-HTML forms for math. These are the LOSSLESS forms
+  // the raw-HTML path (columns/cells) and the mathInline fallback emit, and the
+  // SAME shape the importer's schema parseHTML rebuilds (span/div carrying the
+  // LaTeX in a `text="…"` attribute). Kept as small helpers so the readable
+  // `$…$`/`$$…$$` markdown forms and the raw-HTML forms cannot drift apart.
+  const mathInlineHtml = (latex: string): string =>
+    '<span data-type="mathInline" data-katex="true" text="' + escapeAttr(latex) + '"></span>';
+  const mathBlockHtml = (latex: string): string =>
+    '<div data-type="mathBlock" data-katex="true" text="' + escapeAttr(latex) + '"></div>';
+
+  // #293 canon #6: neutralize a would-be inline-math `$…$` span sitting in PROSE
+  // text so it re-imports as literal text (never a phantom math node). We escape
+  // ONLY the two delimiting `$` of a span the inline-math tokenizer WOULD match
+  // (shared rule, math-inline.ts), leaving the inner untouched. A currency `$`
+  // (`$5`, `$5 and $10`) has no VALID closing under the rule, so it never
+  // matches and is emitted CLEAN (no backslash churn). On re-import marked's
+  // escape tokenizer turns each `\$` back into a literal `$`, so `the set $A$`
+  // round-trips as text while `$5 and $10` stays exactly as written.
+  const escapeProseMath = (value: string): string =>
+    value.replace(inlineMathGlobalRe(), (_match: string, body: string) => "\\$" + body + "\\$");
+
+  // #293 canon #2 inline footnotes. PRE-SCAN the whole tree once: map every
+  // footnote DEFINITION by its id (first-wins) and collect every REFERENCED id.
+  // The canonical markdown form inlines a note's body AT its reference point as
+  // `^[body]`, so the serializer needs the body keyed by id when it reaches a
+  // `footnoteReference`, and needs to know which definitions are orphaned (no
+  // ref) so their bodies are not silently dropped (appended at the doc end).
+  const footnoteDefs = new Map<string, any>();
+  const referencedFootnoteIds = new Set<string>();
+  // ITERATIVE walk (explicit stack, not recursion): a pathologically deep
+  // document must not overflow the call stack here — the same reason processNode
+  // has its depth guard. This scan is unbounded but stack-safe.
+  const scanStack: any[] = [content];
+  while (scanStack.length) {
+    const n = scanStack.pop();
+    if (!n || typeof n !== "object") continue;
+    // First-wins: a later definition reusing an already-seen id is ignored.
+    if (n.type === "footnoteDefinition" && n.attrs?.id && !footnoteDefs.has(n.attrs.id)) {
+      footnoteDefs.set(n.attrs.id, n);
+    }
+    if (n.type === "footnoteReference" && n.attrs?.id) {
+      referencedFootnoteIds.add(n.attrs.id);
+    }
+    if (Array.isArray(n.content)) {
+      // Push children in REVERSE so the LIFO pop visits them in document order;
+      // otherwise "first-wins" would keep the LAST duplicate definition and the
+      // orphan notes (appended in Map insertion order) would come out reversed.
+      for (let k = n.content.length - 1; k >= 0; k--) scanStack.push(n.content[k]);
+    }
+  }
+
+  // Balance `[`/`]` in a rendered footnote body so the whole thing stays a
+  // parseable `^[…]` capture (the importer's tokenizer counts brackets from `^[`
+  // to the matching `]`). A markdown link's `[text](url)` is already balanced
+  // and is left intact; only a STRAY unmatched `]` (or `[`) — e.g. a literal
+  // bracket in prose — is backslash-escaped so it cannot open/close the footnote
+  // early. Already backslash-escaped pairs are passed through untouched.
+  const balanceBrackets = (s: string): string => {
+    const pieces: string[] = [];
+    const pendingOpens: number[] = []; // indices into `pieces` of still-open `[`
+    for (let pos = 0; pos < s.length; pos++) {
+      const ch = s.charAt(pos);
+      switch (ch) {
+        case "\\":
+          if (pos + 1 < s.length) {
+            // Existing escaped pair: copy both chars and skip the second one.
+            pieces.push(ch + s.charAt(pos + 1));
+            pos++;
+          } else {
+            pieces.push(ch); // lone trailing backslash is an ordinary char
+          }
+          break;
+        case "[":
+          pendingOpens.push(pieces.length);
+          pieces.push(ch);
+          break;
+        case "]":
+          // A close either pairs with the nearest pending open or is stray.
+          pieces.push(pendingOpens.pop() === undefined ? "\\]" : "]");
+          break;
+        default:
+          pieces.push(ch);
+      }
+    }
+    // Whatever opens never found a partner are stray: escape them in place.
+    pendingOpens.forEach((at) => {
+      pieces[at] = "\\[";
+    });
+    return pieces.join("");
+  };
+
+  // While TRUE, `case "text"` DOUBLES every RAW user backslash (`\` -> `\\`) in a
+  // text run BEFORE the intentional markdown/balance escapes are layered on (see
+  // the text case). This is the F2 fix: a body ending in `\` (Windows path,
+  // LaTeX, regex) must survive `^[…]`. Without it a trailing `\` serialized to
+  // `^[…\]`, whose `\]` the import tokenizer reads as an ESCAPED `]`, so the
+  // balance never closed and the whole footnote degraded to literal prose (and
+  // the `\` was lost). Doubling raw backslashes makes `parseInline` restore each
+  // (`\\`->`\`) on import while the serializer's OWN single escapes (`\[` `\]`
+  // `\=` `\$`, the `\n` paragraph separator) stay intact. It is a closure flag
+  // (per-conversion, not module state), so concurrent conversions never share it.
+  let inFootnoteBody = false;
+
+  // Render a footnote DEFINITION's `paragraph+` body to INLINE markdown suitable
+  // to sit inside `^[…]`. Each paragraph is rendered inline (so links/marks in
+  // the note round-trip) with raw backslashes doubled (via inFootnoteBody) and
+  // its brackets balanced; paragraphs are then joined with the literal two-char
+  // separator `\n`. Because raw backslashes are already doubled, a real
+  // backslash-n in the text is `\\n` and never mistaken for the separator (the
+  // only unescaped `\n` is the join inserted here). Footnotes are inline (single
+  // line) in markdown, so an embedded hard break collapses to a space.
+  const renderFootnoteBody = (def: any): string => {
+    // Only `paragraph` children contribute to the body; anything else is ignored.
+    const paragraphs: any[] = (def?.content || []).filter(
+      (child: any) => child?.type === "paragraph",
+    );
+    // No paragraph at all still yields one empty segment, so the note
+    // serializes as `^[]`.
+    if (paragraphs.length === 0) paragraphs.push({ content: [] });
+    const rendered: string[] = [];
+    for (const paragraph of paragraphs) {
+      // Raise the flag for this paragraph only and always restore the previous
+      // value, even if rendering throws.
+      const saved = inFootnoteBody;
+      inFootnoteBody = true;
+      try {
+        const inline = renderInlineChildren(paragraph.content || []);
+        // Real newlines become spaces, then stray brackets are escaped.
+        rendered.push(balanceBrackets(inline.replace(/\r?\n/g, " ")));
+      } finally {
+        inFootnoteBody = saved;
+      }
+    }
+    // Paragraphs are joined by the literal two-character separator backslash-n.
+    return rendered.join("\\n");
+  };
+
+  // Recursion depth guard. processNode is mutually recursive (directly and via
+  // processListItem/processTaskItem/blockToHtml), and a pathologically nested
+  // document (e.g. tens of thousands of nested blockquotes) would otherwise
+  // overflow the call stack and throw a RangeError, which would abort the sync
+  // and prevent the page from ever being written. We track the live nesting
+  // depth in a closure counter (the wrapper below) so we NEVER throw: past the
+  // limit we stop recursing and emit the node's own text (or nothing) instead.
+  // Normal documents never approach MAX_NODE_DEPTH, so their output is byte-
+  // identical. NOTE: the wrapper signature is (node) only — several callers use
+  // `.map(processNode)`, which would otherwise pass the array index as a second
+  // argument; the wrapper ignores extra arguments so that is harmless.
+  let nodeDepth = 0;
+
+  // A table cell whose content is NOT a single plain paragraph — a list, code
+  // block, blockquote, multiple paragraphs, etc. A GFM pipe cell can only hold
+  // inline content on one line, so such a cell must force the HTML <table> form
+  // or its structure is flattened/lost on round trip (review #8).
+  const cellIsMultiBlock = (cell: any): boolean => {
+    const children = cell.content || [];
+    if (children.length > 1) return true; // several blocks never fit a pipe cell
+    // An empty cell is fine; a lone child must be a plain paragraph.
+    return children[0] != null ? children[0].type !== "paragraph" : false;
+  };
+
+  // Render a whole table as raw HTML `<table>` (round-trips via the schema's
+  // table-family parseHTML). Used when a GFM pipe table would be wrong: merged
+  // cells (colspan/rowspan), multi-block cells (#8), OR the table sits inside a
+  // raw-HTML container like a column (marked does not parse markdown inside raw
+  // HTML, so a GFM pipe table there becomes literal "| a | b |" text — #7).
+  // `blockToHtml` is referenced lazily (defined below; only called at runtime).
+  const tableToHtml = (tableRows: any[]): string => {
+    // One cell -> `<th>`/`<td>` with optional span/align attributes; its child
+    // blocks are rendered through blockToHtml and concatenated.
+    const cellHtml = (cell: any): string => {
+      const tagName = cell.type === "tableHeader" ? "th" : "td";
+      const cellAttrs = cell.attrs || {};
+      const attrList: string[] = [];
+      for (const span of ["colspan", "rowspan"]) {
+        // A missing span or a span of 1 is the default and is not emitted.
+        if ((cellAttrs[span] ?? 1) > 1) {
+          attrList.push(`${span}="${escapeAttr(cellAttrs[span])}"`);
+        }
+      }
+      if (cellAttrs.align) {
+        attrList.push(`align="${escapeAttr(cellAttrs.align)}"`);
+      }
+      const attrText = attrList.length ? ` ${attrList.join(" ")}` : "";
+      const body = (cell.content || []).map((b: any) => blockToHtml(b)).join("");
+      return `<${tagName}${attrText}>${body}</${tagName}>`;
+    };
+    // Header and body rows alike go into a single <tbody>.
+    const rowHtml = (row: any): string =>
+      `<tr>${(row.content || []).map((c: any) => cellHtml(c)).join("")}</tr>`;
+    const allRows = tableRows.map((r: any) => rowHtml(r)).join("");
+    return `<table><tbody>${allRows}</tbody></table>`;
+  };
+
+  const processNode = (node: any): string => {
+    // A null child (malformed JSON) yields "" rather than a TypeError below.
+    if (node == null) return "";
+    if (nodeDepth >= MAX_NODE_DEPTH) {
+      // Past the limit, stop recursing without throwing: a text node keeps its
+      // own text; a container collapses to "" (its subtree is dropped).
+      return typeof node.text === "string" ? node.text : "";
+    }
+    nodeDepth++;
+    try {
+      return processNodeInner(node);
+    } finally {
+      nodeDepth--;
+    }
+  };
+
+  const processNodeInner = (node: any): string => {
+    const type = node.type;
+    const nodeContent = node.content || [];
+
+    switch (type) {
+      case "doc": {
+        // #293 canon #2: the `footnotesList` is NOT emitted in markdown — every
+        // note body is inlined at its `^[…]` reference. Skip the list entirely
+        // (emitting "" would inject a phantom blank gap via the "\n\n" join),
+        // then append any ORPHAN definition (one no reference points at) as its
+        // own `^[body]` line so its body is never silently lost.
+        // F3 (accepted, intentional): on re-import that orphan `^[body]` line
+        // becomes a reference + definition (an orphan def gains a ref). This is
+        // lossless (the body survives) and byte-stable (it re-exports identically),
+        // so it is deliberately not treated as data loss.
+        const parts: string[] = [];
+        for (const child of nodeContent) {
+          if (child?.type === "footnotesList") continue;
+          parts.push(processNode(child));
+        }
+        for (const [id, def] of footnoteDefs) {
+          if (!referencedFootnoteIds.has(id)) {
+            parts.push(`^[${renderFootnoteBody(def)}]`);
+          }
+        }
+        return parts.join("\n\n");
+      }
+
+      case "paragraph": {
+        const text = renderInlineChildren(nodeContent);
+        const align = node.attrs?.textAlign;
+        // Non-default alignment round-trips as an ATTACHED HTML comment at the
+        // END of the block line (#293 canon #9):
+        //   `some text <!--attrs {"textAlign":"center"}-->`
+        // This replaces the old `<p style="text-align:…">` wrapper (review #10,
+        // itself a replacement for the never-parsed `<div align>`). The schema's
+        // textAlign default is `null`; "left" is the visual default the editor
+        // renders identically to null — neither emits a marker (no churn). The
+        // importer's applyAttachedComments step reads the comment back before the
+        // DOM stage drops it. We only attach when there is text to attach to: a
+        // lone comment on a blank line has no block to bind to on re-import.
+        if (align && align !== "left" && text) {
+          return `${text} ${attachedCommentFor("attrs", { textAlign: align })}`;
+        }
+        return text || "";
+      }
+
+      case "heading": {
+        const level = node.attrs?.level || 1;
+        const headingText = renderInlineChildren(nodeContent);
+        const headingLine = "#".repeat(level) + " " + headingText;
+        const headingAlign = node.attrs?.textAlign;
+        // A non-default heading alignment attaches the same trailing comment
+        // (#293 canon #9), keeping the readable `## text` markdown form:
+        //   `## Title <!--attrs {"textAlign":"center"}-->`
+        // Bare `## text` carries no alignment, so without this an aligned heading
+        // would silently drop textAlign on export. Replaces the old
+        // `<hN style="text-align:…">` HTML form. "left"/null stay bare (no churn).
+        // Require headingText so an empty aligned heading stays bare `##` rather
+        // than emitting a comment with no visible element to attach to (matches
+        // the paragraph guard's `text` check — a lone comment has no block to
+        // bind on re-import).
+        if (headingAlign && headingAlign !== "left" && headingText) {
+          return `${headingLine} ${attachedCommentFor("attrs", { textAlign: headingAlign })}`;
+        }
+        return headingLine;
+      }
+
+      case "text":
+        let textContent = node.text || "";
+        // #293 canon #7: `==` is now a LIVE inline highlight syntax on import (a
+        // marked inline extension turns `==text==` into a color-less highlight
+        // mark). A LITERAL `==` in a text run would therefore be misparsed as a
+        // highlight on the next import, so backslash-escape each `=` of a `==`
+        // pair; marked's escape tokenizer decodes `\=` back to a literal `=`, so
+        // a literal `==` round-trips as text (never materializes a phantom mark).
+        // This runs for BOTH unmarked text and marked non-code runs, but NOT for
+        // an inline code span (a run carrying the `code` mark returns a backtick
+        // span below with `==` verbatim, matching `` `a == b` `` staying code).
+        // A highlight run's own `==` delimiters are appended AFTER this in the
+        // marks loop, so they are never escaped; only the run's inner text is.
+        if (!(node.marks || []).some((m: any) => m.type === "code")) {
+          // #293 canon #2 (F2): inside a footnote body, DOUBLE every RAW user
+          // backslash FIRST, so it survives `^[…]` (the import tokenizer treats
+          // `\<char>` as an escape when balancing brackets, and `parseInline`
+          // decodes escapes). Doing it before the intentional escapes below keeps
+          // the serializer's own single escapes (`\=` `\$` `^\[`, and the `\[`/
+          // `\]` balanceBrackets adds) single; only genuine user backslashes are
+          // doubled. Skipped for code runs (a code span's content is NOT decoded
+          // by parseInline, so its backslashes must stay verbatim).
+          if (inFootnoteBody) {
+            textContent = textContent.replace(/\\/g, "\\\\");
+          }
+          textContent = textContent.replace(/==/g, "\\=\\=");
+          // #293 canon #6: escape a would-be inline-math `$…$` span so it stays
+          // literal text on re-import (currency `$5` is left clean — see
+          // escapeProseMath). Runs on the SAME non-code runs as the `==` escape
+          // above; an inline `code` run returns verbatim below, matching the
+          // codeBlock path (a `$…$` inside code must stay code, never math).
+          textContent = escapeProseMath(textContent);
+          // #293 canon #2: `^[` opens a LIVE inline-footnote span on import
+          // (`^[text]` -> a footnote reference). A LITERAL `^[` in prose text
+          // would therefore materialize a phantom footnote on the next import, so
+          // backslash-escape the bracket (`^[` -> `^\[`); marked's escape
+          // tokenizer decodes `\[` back to `[`, so a literal `^[…]` round-trips
+          // as text and never opens a footnote. Only the OPENING `^[` needs
+          // breaking (the tokenizer requires it), so this is a minimal, idempotent
+          // escape. A real footnoteReference node emits `^[body]` from its own
+          // case, never through here.
+          textContent = textContent.replace(/\^\[/g, "^\\[");
+        }
+        // Apply marks (bold, italic, code, etc.)
+        if (node.marks) {
+          // The schema's `code` mark declares `excludes: "_"` — it excludes every
+          // other inline mark — so the editor can NEVER produce a text run that
+          // carries `code` together with another mark, and on import any
+          // co-occurring mark is always dropped (the run comes back as code-only).
+          // The lossless, byte-stable behavior is therefore: when a run has the
+          // `code` mark, emit ONLY the backtick code span and ignore every other
+          // mark, so md1 is already code-only and md2 === md1. Runs WITHOUT a code
+          // mark are rendered exactly as before.
+          const markTypes = node.marks.map((m: any) => m.type);
+          const hasCode = markTypes.includes("code");
+          if (hasCode) {
+            textContent = `\`${textContent}\``;
+            return textContent;
+          }
+          for (const mark of node.marks) {
+            switch (mark.type) {
+              case "bold":
+                textContent = `**${textContent}**`;
+                break;
+              case "italic":
+                textContent = `*${textContent}*`;
+                break;
+              case "code":
+                // A `code` run already returned above (hasCode early return), so
+                // this branch is only reached for a non-code run that somehow
+                // still lists `code`; emit the plain backtick span.
+                textContent = `\`${textContent}\``;
+                break;
+              case "link": {
+                const href = mark.attrs?.href || "";
+                const title = mark.attrs?.title;
+                if (title) {
+                  // Emit the optional markdown link title; escape an embedded
+                  // double-quote so it cannot terminate the title string early.
+                  const safeTitle = String(title).replace(/"/g, '\\"');
+                  textContent = `[${textContent}](${href} "${safeTitle}")`;
+                } else {
+                  textContent = `[${textContent}](${href})`;
+                }
+                break;
+              }
+              case "strike":
+                textContent = `~~${textContent}~~`;
+                break;
+              case "underline":
+                textContent = `<u>${textContent}</u>`;
+                break;
+              case "subscript":
+                textContent = `<sub>${textContent}</sub>`;
+                break;
+              case "superscript":
+                textContent = `<sup>${textContent}</sup>`;
+                break;
+              case "highlight": {
+                // #293 canon #7: a highlight WITHOUT a color serializes as the
+                // Obsidian/GFM `==text==` syntax (the importer's marked inline
+                // `==` extension parses it back to a color-less highlight mark).
+                // A highlight WITH a color keeps the `<mark style="background-
+                // color: …">` HTML form (the condition is deterministic on the
+                // `color` attr), so a colored highlight is not flattened. The
+                // inner textContent already had any literal `==` backslash-
+                // escaped above, so a highlight over text containing `==` still
+                // round-trips.
+                const color = mark.attrs?.color;
+                textContent = color
+                  ? `<mark style="background-color: ${escapeAttr(color)}">${textContent}</mark>`
+                  : `==${textContent}==`;
+                break;
+              }
+              case "textStyle":
+                if (mark.attrs?.color) {
+                  textContent = `<span style="color: ${escapeAttr(mark.attrs.color)}">${textContent}</span>`;
+                }
+                break;
+              case "spoiler":
+                // Markdown has no native spoiler syntax, so emit the same raw
+                // inline HTML the editor-ext/MCP stack uses. The schema's Spoiler
+                // mark parses span[data-spoiler] back on import, so the mark
+                // survives the PM -> MD -> PM round-trip.
+                textContent = `<span data-spoiler="true">${textContent}</span>`;
+                break;
+              case "comment": {
+                // Emit the inline comment anchor so highlights round-trip. The
+                // schema's Comment mark parses span[data-comment-id] (attrs
+                // commentId/resolved).
+                const cid = mark.attrs?.commentId;
+                if (cid) {
+                  // Hide resolved anchors from agent reads: drop the wrapper and
+                  // keep only the bare text. Active anchors keep their wrapper.
+                  if (mark.attrs?.resolved && dropResolvedCommentAnchors) {
+                    break;
+                  }
+                  const resolvedAttr = mark.attrs?.resolved
+                    ? ` data-resolved="true"`
+                    : "";
+                  textContent = `<span data-comment-id="${escapeAttr(cid)}"${resolvedAttr}>${textContent}</span>`;
+                }
+                break;
+              }
+            }
+          }
+        }
+        return textContent;
+
+      case "codeBlock":
+        const language = node.attrs?.language || "";
+        // Strip ALL trailing newlines so the export is idempotent: marked
+        // re-adds exactly one trailing "\n" on import, so trimming only one
+        // here would let the text grow by "\n" on each round-trip. Removing
+        // every trailing newline makes repeated cycles stable.
+        //
+        // Read the child text RAW (schema codeBlock is `content: "text*"`), NOT
+        // through processNode: code-fence content is literal and markdown escapes
+        // do not apply inside a fence. In particular the canon #7 `==` -> `\=\=`
+        // escape (in `case "text"`) must NOT reach code — marked leaves `\=`
+        // verbatim inside a fence, so routing code through `case "text"` would
+        // permanently stamp backslashes into any `==` (a `==` comparison is
+        // extremely common in source), corrupting the block on the git-sync data
+        // path.
+        const code = nodeContent
+          .map((child: any) => (typeof child?.text === "string" ? child.text : ""))
+          .join("")
+          .replace(/\n+$/, "");
+        // CommonMark: an inner ``` run inside the code would prematurely close
+        // a 3-backtick fence (corrupting the block on re-import). Use an outer
+        // fence one backtick longer than the longest backtick run in the code
+        // (minimum 3) so the inner fence is always content.
+        const longestBacktickRun = (code.match(/`+/g) || []).reduce(
+          (max: number, run: string) => Math.max(max, run.length),
+          0,
+        );
+        const fence = "`".repeat(Math.max(3, longestBacktickRun + 1));
+        return fence + language + "\n" + code + "\n" + fence;
+
+      case "bulletList":
+        return nodeContent
+          .map((item: any) => processListItem(item, "-"))
+          .join("\n");
+
+      case "orderedList":
+        return nodeContent
+          .map((item: any, index: number) =>
+            processListItem(item, `${index + 1}.`),
+          )
+          .join("\n");
+
+      case "taskList":
+        return nodeContent.map((item: any) => processTaskItem(item)).join("\n");
+
+      case "taskItem":
+        // Delegate to the same helper used by taskList so multi-block and
+        // nested task items render and indent consistently.
+        return processTaskItem(node);
+
+      case "listItem":
+        return nodeContent.map(processNode).join("\n");
+
+      case "blockquote":
+        // Prefix EVERY line of EVERY child with "> " and separate block-level
+        // children with a blank ">" line so code blocks / multi-paragraph
+        // quotes round-trip correctly.
+        return nodeContent
+          .map((n: any) =>
+            processNode(n)
+              .split("\n")
+              .map((line: string) => (line.length ? `> ${line}` : ">"))
+              .join("\n"),
+          )
+          .join("\n>\n");
+
+      case "horizontalRule":
+        return "---";
+
+      case "hardBreak":
+        // Two trailing spaces before the newline encode a markdown hard break;
+        // a bare "\n" would be reimported as a soft break and lost.
+        return "  \n";
+
+      case "image": {
+        const imgAttrs = node.attrs || {};
+        // #293 canon #4: a top-level image ALWAYS serializes as `![alt](src)`.
+        // Non-default layout/identity attrs (which markdown `![](src)` cannot
+        // express — width/height/align/size/attachmentId/aspectRatio/caption/
+        // title) are carried in an attached `<!--img {…}-->` comment on the SAME
+        // line, materialized back onto the <img> by markdown-to-prosemirror's
+        // applyCommentDirectives before generateJSON drops the comment.
+        // Escape the alt text: it sits in the `![alt]` label, which the importer
+        // re-parses as CommonMark inline content, so a markdown-active char in a
+        // realistic description ("Figure [1]", "the *new* logo") would break the
+        // round-trip — the image node vanishes / emphasis collapses. Same reason
+        // the link-form media (attachment/pdf/embed) escape their visible text.
+        const imgAlt = escapeLinkText(imgAttrs.alt ?? "");
+        // Neutralize characters that could break out of the markdown image
+        // URL: spaces/newlines and parentheses would terminate the (...) target
+        // and let a stored src inject following markdown/HTML. Percent-encode
+        // them so the URL stays a single inert token.
+        const imgSrc = encodeMdUrl(imgAttrs.src);
+        const base = `![${imgAlt}](${imgSrc})`;
+        // Build the img-comment JSON from the NON-DEFAULT attrs only, in a
+        // STABLE key order so the output is deterministic. An attr equal to its
+        // schema default is NOT emitted (predicate over the canonicalized attrs).
+        const json: Record<string, unknown> = {};
+        // Numeric sizing attrs are coerced to string in the payload: the import
+        // side (applyCommentDirectives) writes them as DOM attributes and the
+        // schema's parseHTML reads them back as strings, so a numeric value would
+        // otherwise round-trip as `420 -> "420"` and produce a one-time spurious
+        // git diff. Emitting the string form up front keeps the round-trip
+        // byte-stable whether the source attr was a number or a string (mirrors
+        // the legacy imageToHtml, which stringified via `width="…"`).
+        if (imgAttrs.width != null) json.width = String(imgAttrs.width);
+        if (imgAttrs.height != null) json.height = String(imgAttrs.height);
+        // align default is unified to "center" (#293 canon #4): treat BOTH null
+        // and "center" as the default and omit them, so a bare/center image stays
+        // clean `![](src)` and only left/right emits `"align"`.
+        if (imgAttrs.align != null && imgAttrs.align !== "center")
+          json.align = imgAttrs.align;
+        if (imgAttrs.size != null) json.size = String(imgAttrs.size);
+        if (imgAttrs.aspectRatio != null)
+          json.aspectRatio = String(imgAttrs.aspectRatio);
+        if (imgAttrs.attachmentId) json.attachmentId = imgAttrs.attachmentId;
+        if (imgAttrs.caption) json.caption = imgAttrs.caption;
+        if (imgAttrs.title) json.title = imgAttrs.title;
+        // No non-default attrs -> bare image, no trailing space, no comment.
+        if (Object.keys(json).length === 0) return base;
+        // attachedCommentFor defuses any `--` in a value (e.g. a caption that
+        // contains the comment-closing `-->`) so the payload can never close the
+        // HTML comment early; JSON.parse on the import side restores it verbatim.
+        return `${base} ${attachedCommentFor("img", json)}`;
+      }
+
+      case "video": {
+        // #293 canon #8 (image-form): a top-level video serializes as
+        // `![](src)<!--video {…}-->`. The bare `![](src)` is ALWAYS followed by
+        // the `video` discriminator comment — a bare image with NO comment is an
+        // `image`, never sniffed by URL — so the comment is REQUIRED even when
+        // there are no extra attrs (emitted name-only as `<!--video-->`). src
+        // lives in the markdown target; every OTHER non-default attr rides in the
+        // comment JSON (stable key order, numerics stringified for byte-stability
+        // exactly like canon #4). align default "center" is omitted. The schema
+        // `<div><video>` form is still emitted on the raw-HTML path (blockToHtml)
+        // via videoToHtml, since comment nodes are dropped inside columns/cells.
+        const attrs = node.attrs || {};
+        const src = encodeMdUrl(attrs.src);
+        const json: Record<string, unknown> = {};
+        if (attrs.alt) json.alt = attrs.alt;
+        if (attrs.attachmentId) json.attachmentId = attrs.attachmentId;
+        if (attrs.width != null) json.width = String(attrs.width);
+        if (attrs.height != null) json.height = String(attrs.height);
+        if (attrs.size != null) json.size = String(attrs.size);
+        if (attrs.align != null && attrs.align !== "center")
+          json.align = attrs.align;
+        if (attrs.aspectRatio != null)
+          json.aspectRatio = String(attrs.aspectRatio);
+        return `![](${src})${standaloneCommentFor("video", json)}`;
+      }
+
+      case "youtube": {
+        // #293 canon #8 (image-form): `![](url)<!--youtube {…}-->`. Same rules as
+        // video — src in the target, other non-default attrs (width/height/align,
+        // align!=center) in the ALWAYS-emitted discriminator comment. The
+        // div[data-type="youtube"] form stays on the raw-HTML path (youtubeToHtml).
+        const attrs = node.attrs || {};
+        const src = encodeMdUrl(attrs.src);
+        const json: Record<string, unknown> = {};
+        if (attrs.width != null) json.width = String(attrs.width);
+        if (attrs.height != null) json.height = String(attrs.height);
+        if (attrs.align != null && attrs.align !== "center")
+          json.align = attrs.align;
+        return `![](${src})${standaloneCommentFor("youtube", json)}`;
+      }
+
+      case "table": {
+        // A GFM pipe table cannot represent merged cells. If ANY cell carries
+        // colspan>1 or rowspan>1, a pipe table would corrupt the grid on
+        // re-import, so emit the WHOLE table as raw HTML <table> instead: the
+        // schema's table family parseHTML (tag table/tr/td/th, with colspan/
+        // rowspan read from the same-named HTML attrs and align via parseHTML)
+        // round-trips it faithfully. Otherwise keep the lighter GFM pipe table.
+        const tableRows: any[] = nodeContent;
+        if (tableRows.length === 0) return "";
+        const hasSpan = tableRows.some((row: any) =>
+          (row.content || []).some(
+            (cell: any) =>
+              (cell.attrs?.colspan ?? 1) > 1 || (cell.attrs?.rowspan ?? 1) > 1,
+          ),
+        );
+        // A GFM pipe table also cannot hold a cell with block content (a list,
+        // code block, paragraphs) — it would be flattened to one line and lost
+        // (review #8). Force the HTML form for those too.
+        const hasMultiBlockCell = tableRows.some((row: any) =>
+          (row.content || []).some((cell: any) => cellIsMultiBlock(cell)),
+        );
+
+        if (hasSpan || hasMultiBlockCell) {
+          return tableToHtml(tableRows);
+        }
+
+        // No merged cells: emit a GFM table (header row + separator) so the
+        // markdown can be parsed back into a table on re-import.
+        const rows = tableRows.map(processNode);
+        const headerCells = tableRows[0]?.content || [];
+        const columns = headerCells.length || 1;
+        // Derive alignment markers (:--, :-:, --:) from each header cell.
+        const markers = Array.from({ length: columns }, (_, i) => {
+          const align = headerCells[i]?.attrs?.align;
+          switch (align) {
+            case "left":
+              return ":--";
+            case "center":
+              return ":-:";
+            case "right":
+              return "--:";
+            default:
+              return "---";
+          }
+        });
+        const separator = "| " + markers.join(" | ") + " |";
+        return [rows[0], separator, ...rows.slice(1)].join("\n");
+      }
+
+      case "tableRow":
+        return "| " + nodeContent.map(processNode).join(" | ") + " |";
+
+      case "tableCell":
+      case "tableHeader": {
+        // Join multiple block children with a space (not "") so adjacent blocks
+        // like a paragraph followed by a list don't collide into "line1- a".
+        // Then collapse newlines and escape pipes so a cell containing "|" or a
+        // line break cannot corrupt the surrounding GFM row.
+        return nodeContent
+          .map(processNode)
+          .join(" ")
+          .replace(/\r?\n/g, " ")
+          .replace(/\|/g, "\\|");
+      }
+
+      case "callout": {
+        // Obsidian-native callout: `> [!type]` opener + a blockquote (`>`-prefixed)
+        // body, so it renders as a callout in Obsidian. The importer parses both
+        // this and the legacy `:::type` fence (existing vaults). Each body line is
+        // blockquote-prefixed; a blank line becomes a bare `>` so the callout is
+        // not split.
+        const calloutType = (node.attrs?.type || "info").toLowerCase();
+        const calloutBody = nodeContent
+          .map(processNode)
+          .join("\n")
+          .split("\n")
+          .map((l: string) => (l.length ? `> ${l}` : ">"))
+          .join("\n");
+        return `> [!${calloutType}]\n${calloutBody}`;
+      }
+
+      case "details": {
+        // The `open` (collapsed/expanded) state lives on the details node, NOT on
+        // the summary, so emit the <details> wrapper HERE carrying it — otherwise
+        // the open state is dropped on a round trip. The schema's details node
+        // parses `open` back from the attribute.
+        const open = node.attrs?.open ? " open" : "";
+        return `<details${open}>\n${nodeContent.map(processNode).join("")}</details>`;
+      }
+
+      case "detailsSummary":
+        return `<summary>${renderInlineChildren(nodeContent)}</summary>\n\n`;
+
+      case "detailsContent":
+        return `${nodeContent.map(processNode).join("\n")}\n`;
+
+      case "mathInline": {
+        // #293 canon #6: inline math serializes as Obsidian-native `$LaTeX$`
+        // (readable, re-parsed by the importer's marked inline extension). A
+        // literal `$` inside the LaTeX is escaped `\$` so it cannot close the
+        // span early (the importer decodes `\$`→`$`). When the LaTeX cannot be
+        // safely fenced (empty, whitespace-edged, multi-line, or an ambiguous
+        // backslash-before-`$`), fall back to the LOSSLESS schema-HTML `<span>`
+        // form (inlineMathSerializable). A following-sibling digit — which would
+        // also break the pandoc closing rule — is handled by renderInlineChildren
+        // (this case cannot see siblings).
+        const inlineMath = node.attrs?.text || "";
+        if (!inlineMathSerializable(inlineMath)) {
+          return mathInlineHtml(inlineMath);
+        }
+        return `$${encodeInlineMathLatex(inlineMath)}$`;
+      }
+
+      case "mathBlock": {
+        // #293 canon #6: block math serializes as a `$$` fence on its own lines
+        // (`$$\n<latex>\n$$`), so multi-line LaTeX is preserved. If the LaTeX
+        // itself contains a `$$` (which would close the fence early — essentially
+        // never valid inside a single math node), fall back to the lossless
+        // schema-HTML `<div>` form.
+        const blockMath = node.attrs?.text || "";
+        if (blockMath.includes("$$")) {
+          return mathBlockHtml(blockMath);
+        }
+        return `$$\n${blockMath}\n$$`;
+      }
+
+      case "mention": {
+        // Emit span[data-type="mention"] with the schema's data-* attributes so
+        // generateJSON rebuilds the mention node instead of leaving "@label"
+        // plain text that cannot re-parse.
+        const attrs = node.attrs || {};
+        const parts: string[] = [`data-type="mention"`];
+        if (attrs.id) parts.push(`data-id="${escapeAttr(attrs.id)}"`);
+        if (attrs.label)
+          parts.push(`data-label="${escapeAttr(attrs.label)}"`);
+        if (attrs.entityType)
+          parts.push(`data-entity-type="${escapeAttr(attrs.entityType)}"`);
+        if (attrs.entityId)
+          parts.push(`data-entity-id="${escapeAttr(attrs.entityId)}"`);
+        if (attrs.slugId)
+          parts.push(`data-slug-id="${escapeAttr(attrs.slugId)}"`);
+        if (attrs.creatorId)
+          parts.push(`data-creator-id="${escapeAttr(attrs.creatorId)}"`);
+        if (attrs.anchorId)
+          parts.push(`data-anchor-id="${escapeAttr(attrs.anchorId)}"`);
+        // Keep the label as visible text content too; the schema reads attrs
+        // from data-*, so the inner text is purely cosmetic and harmless.
+        const mentionLabel = attrs.label || attrs.id || "";
+        // The label is visible element TEXT content here (the data-* attrs above
+        // carry the real values), so escape it for the text context, not attrs.
+        return `<span ${parts.join(" ")}>@${escapeHtmlText(mentionLabel)}</span>`;
+      }
+
+      case "attachment": {
+        // #293 canon #8 (link-form): `[filename](src)<!--attachment {…}-->`. The
+        // schema's `url` is the markdown target; the VISIBLE text is the filename
+        // (`attrs.name`, escaped so `[`/`]` cannot break the label). Every OTHER
+        // non-default attr (mime/size/attachmentId) rides in the ALWAYS-emitted
+        // discriminator comment — a bare `[text](src)` with no comment is a plain
+        // link, never an attachment. The div[data-type="attachment"] form stays
+        // on the raw-HTML path (attachmentToHtml) for columns/cells.
+        const attrs = node.attrs || {};
+        const src = encodeMdUrl(attrs.url);
+        const text = escapeLinkText(attrs.name ?? "");
+        const json: Record<string, unknown> = {};
+        if (attrs.mime) json.mime = attrs.mime;
+        if (attrs.size != null) json.size = String(attrs.size);
+        if (attrs.attachmentId) json.attachmentId = attrs.attachmentId;
+        return `[${text}](${src})${standaloneCommentFor("attachment", json)}`;
+      }
+
+      case "drawio":
+      case "excalidraw": {
+        // #293 canon #8 (image-form): `![](src)<!--drawio|excalidraw {…}-->`. src
+        // in the target; title/alt/width/height/size/aspectRatio/align(!=center)/
+        // attachmentId in the ALWAYS-emitted discriminator comment (the NAME
+        // selects drawio vs excalidraw). The div[data-type=…] form stays on the
+        // raw-HTML path (diagramToHtml).
+        const attrs = node.attrs || {};
+        const src = encodeMdUrl(attrs.src);
+        const json: Record<string, unknown> = {};
+        if (attrs.title != null) json.title = attrs.title;
+        if (attrs.alt != null) json.alt = attrs.alt;
+        if (attrs.width != null) json.width = String(attrs.width);
+        if (attrs.height != null) json.height = String(attrs.height);
+        if (attrs.size != null) json.size = String(attrs.size);
+        if (attrs.aspectRatio != null)
+          json.aspectRatio = String(attrs.aspectRatio);
+        if (attrs.align != null && attrs.align !== "center")
+          json.align = attrs.align;
+        if (attrs.attachmentId) json.attachmentId = attrs.attachmentId;
+        return `![](${src})${standaloneCommentFor(type, json)}`;
+      }
+
+      case "embed": {
+        // #293 canon #8 (link-form): `[provider](src)<!--embed {…}-->`. src in
+        // the target; the VISIBLE text is the provider (`attrs.provider`). align/
+        // width/height ride in the discriminator comment only when non-default
+        // (align "center", width 800, height 600 are the schema defaults). The
+        // div[data-type="embed"] form stays on the raw-HTML path (embedToHtml).
+        const attrs = node.attrs || {};
+        const src = encodeMdUrl(attrs.src);
+        const text = escapeLinkText(attrs.provider ?? "");
+        const json: Record<string, unknown> = {};
+        if (attrs.align != null && attrs.align !== "center")
+          json.align = attrs.align;
+        if (attrs.width != null && attrs.width !== 800)
+          json.width = String(attrs.width);
+        if (attrs.height != null && attrs.height !== 600)
+          json.height = String(attrs.height);
+        return `[${text}](${src})${standaloneCommentFor("embed", json)}`;
+      }
+
+      case "audio": {
+        // #293 canon #8 (image-form): `![](src)<!--audio {…}-->`. src in the
+        // target; attachmentId/size in the ALWAYS-emitted discriminator comment.
+        // The <div><audio> form stays on the raw-HTML path (audioToHtml).
+        const attrs = node.attrs || {};
+        const src = encodeMdUrl(attrs.src);
+        const json: Record<string, unknown> = {};
+        if (attrs.attachmentId) json.attachmentId = attrs.attachmentId;
+        if (attrs.size != null) json.size = String(attrs.size);
+        return `![](${src})${standaloneCommentFor("audio", json)}`;
+      }
+
+      case "pdf": {
+        // #293 canon #8 (link-form): `[filename](src)<!--pdf {…}-->`. src in the
+        // target; the VISIBLE text is the filename (`attrs.name`). attachmentId/
+        // size/width/height ride in the ALWAYS-emitted discriminator comment. The
+        // div[data-type="pdf"] form stays on the raw-HTML path (pdfToHtml).
+        const attrs = node.attrs || {};
+        const src = encodeMdUrl(attrs.src);
+        const text = escapeLinkText(attrs.name ?? "");
+        const json: Record<string, unknown> = {};
+        if (attrs.attachmentId) json.attachmentId = attrs.attachmentId;
+        if (attrs.size != null) json.size = String(attrs.size);
+        if (attrs.width != null) json.width = String(attrs.width);
+        if (attrs.height != null) json.height = String(attrs.height);
+        return `[${text}](${src})${standaloneCommentFor("pdf", json)}`;
+      }
+
+      case "columns": {
+        // Emit the schema-matching div[data-type="columns"] wrapper so the
+        // multi-column layout survives. Without a case the children were
+        // concatenated with no separator and the text merged. The schema reads
+        // layout from data-layout and widthMode from data-width-mode. The whole
+        // block is raw HTML, so render children via blockToHtml (NOT markdown,
+        // which marked would not re-parse inside a raw HTML block).
+        const attrs = node.attrs || {};
+        const parts: string[] = [`data-type="columns"`];
+        if (attrs.layout)
+          parts.push(`data-layout="${escapeAttr(attrs.layout)}"`);
+        if (attrs.widthMode && attrs.widthMode !== "normal")
+          parts.push(`data-width-mode="${escapeAttr(attrs.widthMode)}"`);
+        const inner = nodeContent.map((n: any) => blockToHtml(n)).join("");
+        return `<div ${parts.join(" ")}>${inner}</div>`;
+      }
+
+      case "column": {
+        // Emit the schema-matching div[data-type="column"]; the schema reads the
+        // column width from data-width. Children are rendered as HTML so their
+        // formatting survives inside this raw HTML block.
+        const attrs = node.attrs || {};
+        const parts: string[] = [`data-type="column"`];
+        if (attrs.width)
+          parts.push(`data-width="${escapeAttr(attrs.width)}"`);
+        const inner = nodeContent.map((n: any) => blockToHtml(n)).join("");
+        return `<div ${parts.join(" ")}>${inner}</div>`;
+      }
+
+      case "pageBreak":
+        // #293 canon #5: a pageBreak is a STANDALONE machinery comment on its
+        // own line — `<!--pagebreak-->` — which is invisible in any markdown
+        // renderer yet round-trips (the importer materializes it back into the
+        // pageBreak atom; see markdown-to-prosemirror's applyCommentDirectives).
+        // This keeps the markdown readable instead of leaking a raw <div>. The
+        // schema div-form is still emitted on the raw-HTML path (blockToHtml),
+        // because DOM parsers drop comment nodes inside columns/cells.
+        return standaloneCommentFor("pagebreak");
+
+      case "subpages":
+        // #293 canon #5: a subpages block serializes as a STANDALONE comment —
+        // `<!--subpages-->` by default, or `<!--subpages {"recursive":true}-->`
+        // when the recursive toggle is set. Same rationale as pageBreak: readable
+        // markdown, invisible in renderers, re-materialized on import. The div
+        // form (`<div data-type="subpages">`) is retained on the raw-HTML path
+        // (blockToHtml) since comments cannot survive a DOM parse inside columns.
+        return node.attrs?.recursive
+          ? standaloneCommentFor("subpages", { recursive: true })
+          : standaloneCommentFor("subpages");
+
+      case "status": {
+        // Inline status pill. The schema reads the label from the element's
+        // TEXT content and the color from data-color, so emit both; without a
+        // case this inline atom fell through to `default` and collapsed to "".
+        const attrs = node.attrs || {};
+        const statusColor = attrs.color || "gray";
+        return `<span data-type="status" data-color="${escapeAttr(statusColor)}">${escapeHtmlText(attrs.text ?? "")}</span>`;
+      }
+
+      case "htmlEmbed": {
+        // Block atom; the schema reads the raw source from a base64-encoded
+        // data-source attribute (and an optional fixed height from data-height).
+        // Encode with the shared helper so it decodes symmetrically on import.
+        const attrs = node.attrs || {};
+        const parts: string[] = [
+          `data-type="htmlEmbed"`,
+          `data-source="${escapeAttr(encodeHtmlEmbedSource(attrs.source ?? ""))}"`,
+        ];
+        if (attrs.height != null)
+          parts.push(`data-height="${escapeAttr(attrs.height)}"`);
+        return `<div ${parts.join(" ")}></div>`;
+      }
+
+      case "footnoteReference": {
+        // #293 canon #2: on the top-level/inline markdown path a footnote is
+        // written AT its reference as `^[body]` (Pandoc/Obsidian inline
+        // footnote). Look the body up by id in the pre-scanned definitions map
+        // and render it inline. An ORPHAN reference (no matching definition) has
+        // no body anywhere, so it emits `^[]` — a footnote with an empty body,
+        // the lossless choice (the id was already derived, never authored). The
+        // separate `<section data-footnotes>` list is NOT emitted (see the
+        // footnotesList/doc cases); the raw-HTML path carries the body on the
+        // <sup> instead (inlineToHtml).
+        const def = footnoteDefs.get(node.attrs?.id);
+        return `^[${def ? renderFootnoteBody(def) : ""}]`;
+      }
+
+      case "footnotesList":
+        // Bodies are inlined at their references (`^[…]`), so the bottom list
+        // emits NOTHING in markdown. The doc case skips it outright to avoid a
+        // phantom blank line; this case guards any non-doc-level occurrence.
+        return "";
+
+      case "footnoteDefinition":
+        // Reached only via a footnotesList (handled above) — never rendered on
+        // its own on the markdown path; its body rides at the reference.
+        return "";
+
+      case "pageEmbed": {
+        // #293 canon #8 (standalone): a whole-page live embed serializes as a
+        // lone discriminator comment on its own line — `<!--pageembed-->` or
+        // `<!--pageembed {"sourcePageId":…}-->`. Readable markdown, invisible in
+        // renderers, re-materialized on import. The div[data-type="pageEmbed"]
+        // form stays on the raw-HTML path (pageEmbedToHtml) for columns/cells.
+        const attrs = node.attrs || {};
+        const json: Record<string, unknown> = {};
+        if (attrs.sourcePageId) json.sourcePageId = attrs.sourcePageId;
+        return standaloneCommentFor("pageembed", json);
+      }
+
+      case "transclusionReference": {
+        // #293 canon #8 (standalone): a live block/page reference serializes as a
+        // lone `<!--transclusion {…}-->` comment carrying sourcePageId +
+        // transclusionId (the data-loss-critical id links). The
+        // div[data-type="transclusionReference"] form stays on the raw-HTML path
+        // (transclusionReferenceToHtml). (transclusionSource is unchanged — it has
+        // block children and keeps recursing through processNode.)
+        const attrs = node.attrs || {};
+        const json: Record<string, unknown> = {};
+        if (attrs.sourcePageId) json.sourcePageId = attrs.sourcePageId;
+        if (attrs.transclusionId) json.transclusionId = attrs.transclusionId;
+        return standaloneCommentFor("transclusion", json);
+      }
+
+      case "transclusionSource": {
+        // Sync-source container; the schema reads data-id and re-parses its
+        // block children, so render them as schema-matching HTML.
+        const attrs = node.attrs || {};
+        const idAttr = attrs.id ? ` data-id="${escapeAttr(attrs.id)}"` : "";
+        const inner = nodeContent.map((n: any) => blockToHtml(n)).join("");
+        return `<div data-type="transclusionSource"${idAttr}>${inner}</div>`;
+      }
+
+      default:
+        // Fallback: process children
+        return nodeContent.map(processNode).join("");
+    }
+  };
+
+  // Render a run of inline children to MARKDOWN, applying the #293 canon #6
+  // inline-math guard.
+  //
+  // Each child is rendered with processNode and the results are concatenated.
+  // A `mathInline` whose rendered form starts with `$` is re-rendered through
+  // mathInlineHtml when the output that FOLLOWS it begins with a DIGIT: a digit
+  // right after the closing `$` makes the pandoc inline rule (the currency
+  // guard) refuse to parse the span as math, so the node would re-import as
+  // literal text (data loss).
+  //
+  // The lookahead skips siblings that render to an empty string. They add
+  // nothing to the joined output, so the first NON-EMPTY following part is what
+  // actually lands after the closing `$`; checking only the adjacent part would
+  // miss `[math, <empty>, "5…"]`, which still joins to `$x$5…`.
+  //
+  // Every other inline node is emitted exactly as processNode rendered it, so
+  // output is unchanged whenever no math ends up directly before a digit.
+  const renderInlineChildren = (nodes: any[]): string => {
+    const parts = nodes.map(processNode);
+    for (let i = 0; i < nodes.length - 1; i++) {
+      // Only a math node whose rendered form starts with `$` needs the guard.
+      if (nodes[i]?.type !== "mathInline" || !parts[i].startsWith("$")) {
+        continue;
+      }
+      // First following part that contributes output (undefined when every
+      // remaining sibling renders empty).
+      const following = parts
+        .slice(i + 1)
+        .find((part: string) => Boolean(part));
+      if (/^[0-9]/.test(following || "")) {
+        parts[i] = mathInlineHtml(nodes[i].attrs?.text || "");
+      }
+    }
+    return parts.join("");
+  };
+
+  // Render inline nodes to HTML for the raw-HTML fallbacks (spanned tables,
+  // columns), where marked will NOT re-parse markdown and backtick/asterisk/
+  // bracket syntax would leak as literal characters. Text is HTML-escaped, then
+  // wrapped once per mark in array order (first mark innermost) with the HTML
+  // the schema's parseHTML accepts; unhandled mark types leave the text as is.
+  const inlineToHtml = (inlineNodes: any[]): string =>
+    (inlineNodes || [])
+      .map((n: any) => {
+        if (n.type === "hardBreak") return "<br>";
+        // #293 canon #6: on the raw-HTML path (columns/spanned cells) marked does
+        // NOT re-parse markdown, so inline math MUST stay the schema-HTML `<span>`
+        // form here — a `$…$` fence would land as literal text on re-import.
+        if (n.type === "mathInline") return mathInlineHtml(n.attrs?.text || "");
+        if (n.type === "footnoteReference") {
+          // #293 canon #2 raw-HTML path (columns/spanned cells): marked does NOT
+          // re-parse `^[…]` inside raw HTML, so the note text rides ON the <sup>
+          // in a `data-fn-text` attribute (encoded exactly like the `^[…]`
+          // inner). NO id is emitted here (F1): the importer's footnote post-pass
+          // assigns ids by dedup-ing on the EXACT body text, so a column footnote
+          // and an inline `^[…]` with the same body merge to one definition and
+          // DIFFERENT bodies can never collide. The post-pass reads data-fn-text,
+          // sets data-id, builds the doc-level definition, and strips the attr.
+          const def = footnoteDefs.get(n.attrs?.id);
+          const body = def ? renderFootnoteBody(def) : "";
+          return `<sup data-footnote-ref data-fn-text="${escapeAttr(body)}"></sup>`;
+        }
+        if (n.type !== "text") {
+          // Other inline atoms (mention, status) already emit schema HTML from
+          // processNode.
+          return processNode(n);
+        }
+        let t = escapeHtmlText(n.text || "");
+        for (const mark of n.marks || []) {
+          switch (mark.type) {
+            case "bold":
+              t = `<strong>${t}</strong>`;
+              break;
+            case "italic":
+              t = `<em>${t}</em>`;
+              break;
+            case "code":
+              t = `<code>${t}</code>`;
+              break;
+            case "strike":
+              t = `<s>${t}</s>`;
+              break;
+            case "underline":
+              t = `<u>${t}</u>`;
+              break;
+            case "subscript":
+              t = `<sub>${t}</sub>`;
+              break;
+            case "superscript":
+              t = `<sup>${t}</sup>`;
+              break;
+            case "link": {
+              // Mirror the top-level link path: emit the optional `title` too
+              // (the schema's link mark carries a `title` attr — see
+              // DocmostAttributes link globals — so <a title> round-trips). A
+              // link with a title inside a column/spanned cell would otherwise
+              // drop it on re-import.
+              const linkTitle = mark.attrs?.title;
+              const titleAttr = linkTitle
+                ? ` title="${escapeAttr(String(linkTitle))}"`
+                : "";
+              t = `<a href="${escapeAttr(mark.attrs?.href || "")}"${titleAttr}>${t}</a>`;
+              break;
+            }
+            case "highlight":
+              t = mark.attrs?.color
+                ? `<mark style="background-color: ${escapeAttr(mark.attrs.color)}">${t}</mark>`
+                : `<mark>${t}</mark>`;
+              break;
+            case "textStyle":
+              if (mark.attrs?.color)
+                t = `<span style="color: ${escapeAttr(mark.attrs.color)}">${t}</span>`;
+              break;
+            case "spoiler":
+              // Emit the same raw inline HTML the top-level path uses. The
+              // schema's Spoiler mark parses span[data-spoiler] back on import,
+              // so a spoiler inside a column/spanned cell survives the round
+              // trip (without this case the mark was silently lost here).
+              t = `<span data-spoiler="true">${t}</span>`;
+              break;
+            case "comment":
+              // Inline comment anchor inside a raw-HTML container (columns /
+              // spanned table cells), so commented text there also round-trips.
+              if (mark.attrs?.commentId) {
+                // Hide resolved anchors from agent reads: drop the wrapper and
+                // keep only the bare text. Active anchors keep their wrapper.
+                if (mark.attrs?.resolved && dropResolvedCommentAnchors) {
+                  break;
+                }
+                const r = mark.attrs?.resolved ? ` data-resolved="true"` : "";
+                t = `<span data-comment-id="${escapeAttr(mark.attrs.commentId)}"${r}>${t}</span>`;
+              }
+              break;
+          }
+        }
+        return t;
+      })
+      .join("");
+
+  // Emit the schema-matching <img> for an image node. Shared so the image is
+  // emitted as real HTML wherever a raw-HTML container needs it (inside a column
+  // or a spanned table cell), where markdown `![](...)` would NOT be re-parsed
+  // and would survive as literal text. The Image extension reads src/alt from
+  // the standard attributes; the Docmost extra attrs (width/height/align/size/
+  // attachmentId/aspectRatio) are global attributes read from same-named DOM
+  // attributes, so emit them by name.
+  const imageToHtml = (node: any): string => {
+    const a = node.attrs || {};
+    const out: string[] = [];
+    // Append one name="value" pair, attribute-escaping the value.
+    const put = (name: string, value: any) =>
+      out.push(`${name}="${escapeAttr(value)}"`);
+    put("src", a.src ?? "");
+    if (a.alt) put("alt", a.alt);
+    if (a.title) put("title", a.title);
+    if (a.width != null) put("width", a.width);
+    if (a.height != null) put("height", a.height);
+    // #293 canon #4: "center" is the unified default alignment, so only a
+    // genuinely non-default alignment (left/right) is written out.
+    if (a.align && a.align !== "center") put("align", a.align);
+    if (a.size != null) put("data-size", a.size);
+    if (a.attachmentId) put("data-attachment-id", a.attachmentId);
+    if (a.aspectRatio != null) put("data-aspect-ratio", a.aspectRatio);
+    // Plain-text caption (issue #221): markdown `![](src)` cannot carry it, so
+    // it rides in data-caption, which the schema's `caption` attr parses back.
+    if (a.caption) put("data-caption", a.caption);
+    return `<img ${out.join(" ")}>`;
+  };
+
+  // Emit the schema-matching div[data-type="callout"] for a callout node. The
+  // schema reads the banner type from data-callout-type. Children are rendered
+  // as HTML so they survive inside a raw-HTML container.
+  const calloutToHtml = (node: any): string => {
+    const kind = escapeAttr((node.attrs?.type || "info").toLowerCase());
+    const body = (node.content || []).map(blockToHtml).join("");
+    return `<div data-type="callout" data-callout-type="${kind}">${body}</div>`;
+  };
+
+  // Emit a schema-matching <details> tree. The schema parses <details>,
+  // summary[data-type="detailsSummary"], and div[data-type="detailsContent"].
+  // The `open` (collapsed/expanded) state lives on the details node and the
+  // schema parses it back from the attribute, so emit it here too — mirroring
+  // the top-level `details` case — or a NESTED details (inside columns/cells)
+  // would silently drop `open:true` every round trip.
+  const detailsToHtml = (node: any): string => {
+    const body = (node.content || []).map(blockToHtml).join("");
+    const tag = node.attrs?.open ? "<details open>" : "<details>";
+    return `${tag}${body}</details>`;
+  };
+  const detailsSummaryToHtml = ({ content }: any): string =>
+    `<summary data-type="detailsSummary">${inlineToHtml(content || [])}</summary>`;
+  const detailsContentToHtml = (node: any): string => {
+    const rendered: string[] = (node.content || []).map(blockToHtml);
+    return ['<div data-type="detailsContent">', ...rendered, "</div>"].join("");
+  };
+
+  // Emit the schema-matching taskList/taskItem HTML. bridgeTaskLists (in
+  // collaboration.ts) recognizes ul[data-type="taskList"] with
+  // li[data-type="taskItem"][data-checked]; emitting that directly here keeps
+  // task lists inside columns/cells from degrading to literal "- [ ]" text.
+  const taskListToHtml = (node: any): string => {
+    // One <li> per task item; data-checked is always a literal "true"/"false".
+    const renderItem = (it: any): string => {
+      const state = it.attrs?.checked ? "true" : "false";
+      const body = blockChildrenToHtml(it);
+      return `<li data-type="taskItem" data-checked="${state}">${body}</li>`;
+    };
+    return `<ul data-type="taskList">${(node.content || []).map(renderItem).join("")}</ul>`;
+  };
+
+  // Render a block node to HTML for the raw-HTML containers (spanned tables,
+  // columns). marked does NOT re-parse markdown inside a raw-HTML block, so
+  // EVERY block type that can appear inside a column or a spanned cell must be
+  // emitted as schema-matching HTML here — never as markdown, or it would land
+  // as literal text on re-import. Only nodes whose processNode case already
+  // emits schema-matching HTML (columns/column, htmlEmbed, transclusionSource)
+  // are delegated to processNode; every markdown- or comment-emitting case
+  // (image, lists, table, callout, details, media, math, …) gets explicit HTML.
+  const blockToHtml = (block: any): string => {
+    const children = block.content || [];
+    switch (block.type) {
+      case "paragraph": {
+        // Carry textAlign here too (symmetric with the processNode paragraph
+        // case): a paragraph nested inside an HTML container (column/table/
+        // callout) would otherwise drop its alignment on the round trip.
+        const pAlign = block.attrs?.textAlign;
+        const pStyle =
+          pAlign && pAlign !== "left"
+            ? ` style="text-align:${escapeAttr(pAlign)}"`
+            : "";
+        return `<p${pStyle}>${inlineToHtml(children)}</p>`;
+      }
+      case "heading": {
+        // Same for a heading nested in an HTML container: emit the alignment as
+        // an inline style (symmetric with the processNode heading case) so it is
+        // not silently dropped. Clamp the level to a valid HTML heading tag.
+        const level = Math.min(6, Math.max(1, block.attrs?.level || 1));
+        const hAlign = block.attrs?.textAlign;
+        const hStyle =
+          hAlign && hAlign !== "left"
+            ? ` style="text-align:${escapeAttr(hAlign)}"`
+            : "";
+        return `<h${level}${hStyle}>${inlineToHtml(children)}</h${level}>`;
+      }
+      case "bulletList":
+        return `<ul>${children
+          .map((li: any) => `<li>${blockChildrenToHtml(li)}</li>`)
+          .join("")}</ul>`;
+      case "orderedList":
+        return `<ol>${children
+          .map((li: any) => `<li>${blockChildrenToHtml(li)}</li>`)
+          .join("")}</ol>`;
+      case "codeBlock": {
+        const lang = block.attrs?.language || "";
+        // The code itself is element TEXT content (between <code> tags), so it
+        // must escape < > & — NOT the attribute escaper. The language rides in
+        // a class ATTRIBUTE, so it uses escapeAttr.
+        const code = escapeHtmlText(
+          children
+            .map(processNode)
+            .join("")
+            .replace(/\n+$/, ""),
+        );
+        const cls = lang ? ` class="language-${escapeAttr(lang)}"` : "";
+        return `<pre><code${cls}>${code}</code></pre>`;
+      }
+      case "image":
+        return imageToHtml(block);
+      case "blockquote":
+        return `<blockquote>${children.map(blockToHtml).join("")}</blockquote>`;
+      case "horizontalRule":
+        return "<hr>";
+      case "callout":
+        return calloutToHtml(block);
+      case "details":
+        return detailsToHtml(block);
+      case "detailsSummary":
+        return detailsSummaryToHtml(block);
+      case "detailsContent":
+        return detailsContentToHtml(block);
+      case "taskList":
+        return taskListToHtml(block);
+      case "taskItem":
+        // A bare taskItem (outside a taskList) still needs a wrapping list so
+        // the schema parses it; wrap it in a single-item taskList.
+        return taskListToHtml({ content: [block] });
+      // A table nested in a raw-HTML block (e.g. inside a column) MUST be the
+      // HTML <table> form — a GFM pipe table here would not be re-parsed by
+      // marked and would round-trip as literal "| a | b |" text (review #7).
+      case "table":
+        return tableToHtml(block.content || []);
+      // #293 canon #5: on the TOP-LEVEL path (processNode) subpages/pageBreak
+      // serialize as standalone `<!--...-->` comments, but a comment node is
+      // discarded by the DOM parse stage (jsdom/parse5) that reads back a raw-
+      // HTML block — so inside a column/cell the comment form would silently
+      // vanish (latent data loss; these atoms previously fell through to the
+      // `default` <div></div>). Here we KEEP the schema-matching div-form so the
+      // node survives the raw-HTML round trip.
+      case "pageBreak":
+        return `<div data-type="pageBreak"></div>`;
+      case "subpages": {
+        const recursive = block.attrs?.recursive ? ` data-recursive="true"` : "";
+        return `<div data-type="subpages"${recursive}></div>`;
+      }
+      // #293 canon #8: the media/discriminator family now serializes at TOP LEVEL
+      // (processNode) as md-target + `<!--name-->` comment. A comment node is
+      // DROPPED by the DOM parse stage that reads a raw-HTML block back, so inside
+      // a column/cell the comment form would silently vanish (data loss). Give
+      // each an EXPLICIT schema-HTML case here (via the shared media-html builders
+      // — the SAME output processNode used to emit, and the same the importer
+      // rebuilds) instead of delegating to processNode's md+comment form.
+      case "video":
+        return videoToHtml(block.attrs || {});
+      case "audio":
+        return audioToHtml(block.attrs || {});
+      case "pdf":
+        return pdfToHtml(block.attrs || {});
+      case "youtube":
+        return youtubeToHtml(block.attrs || {});
+      case "embed":
+        return embedToHtml(block.attrs || {});
+      case "attachment":
+        return attachmentToHtml(block.attrs || {});
+      case "drawio":
+      case "excalidraw":
+        return diagramToHtml(block.type, block.attrs || {});
+      case "pageEmbed":
+        return pageEmbedToHtml(block.attrs || {});
+      case "transclusionReference":
+        return transclusionReferenceToHtml(block.attrs || {});
+      // #293 canon #6: on the TOP-LEVEL path (processNode) mathBlock now
+      // serializes as a `$$…$$` fence, but marked does NOT re-parse markdown
+      // inside a raw-HTML block, so inside a column/cell it MUST stay the
+      // schema-HTML `<div>` form or it would land as literal `$$…$$` text on
+      // re-import. Give it an EXPLICIT case here (the same form the importer
+      // rebuilds) instead of delegating to processNode's fence form.
+      case "mathBlock":
+        return mathBlockHtml(block.attrs?.text || "");
+      // #293 canon #2: on the markdown path a footnotesList emits nothing (the
+      // note body rides at each `^[…]` reference). But a raw-HTML container
+      // drops comment/markdown reconstruction, so KEEP the schema-matching
+      // <section>/<div> HTML here so a footnotesList that ever lands inside a
+      // column/cell still round-trips via the schema's parseHTML instead of
+      // vanishing. (Normally the list is doc-level and never nests here.)
+      case "footnotesList": {
+        const inner = (block.content || []).map(blockToHtml).join("");
+        return `<section data-footnotes>${inner}</section>`;
+      }
+      case "footnoteDefinition": {
+        const idAttr = block.attrs?.id
+          ? ` data-id="${escapeAttr(block.attrs.id)}"`
+          : "";
+        const inner = (block.content || []).map(blockToHtml).join("");
+        return `<div data-footnote-def${idAttr}>${inner}</div>`;
+      }
+      // columns/column, htmlEmbed, transclusionSource already emit
+      // schema-matching HTML from processNode.
+      case "columns":
+      case "column":
+      case "htmlEmbed":
+      case "transclusionSource":
+        return processNode(block);
+      default:
+        // Any still-unhandled block type: NEVER fall back to markdown inside a
+        // raw-HTML block (it would become literal text). A node's children are
+        // all-inline or all-block, so ONE known inline child means inline
+        // content; a text/hardBreak sent to blockToHtml would be emitted empty.
+        if (children.some((c: any) => /^(?:text|hardBreak|mathInline|footnoteReference)$/.test(c.type))) {
+          return `<div>${inlineToHtml(children)}</div>`;
+        }
+        return `<div>${children.map(blockToHtml).join("")}</div>`;
+    }
+  };
+
+  // Render the block children of a list item to HTML (a listItem holds block+
+  // content). Mirrors processListItem but for the HTML fallback path.
+  const blockChildrenToHtml = ({ content }: any): string =>
+    (content || []).map((child: any) => blockToHtml(child)).join("");
+
+  // Indent the rendered children of a list item under a marker prefix.
+  // Each child block is a (possibly multi-line) string. The very first physical
+  // line of the first child carries the marker (e.g. "- " or "1. "); EVERY
+  // other line — the remaining lines of the first child AND all lines of every
+  // subsequent child (nested lists, code blocks, extra paragraphs) — is indented
+  // to align under the marker. Without indenting these continuation lines, the
+  // 2nd/3rd line of a nested child collapses to column 0 and escapes the list.
+  //
+  // The continuation indent MUST equal the LIST marker width, which is not the
+  // same as the visible prefix width:
+  //   - bullet "- "          -> 2 columns
+  //   - task   "- [ ] "      -> marker is still "- " (the "[ ] " is content), 2
+  //   - ordered "1. "/"10. " -> 3/4 columns, scaling with the number's digits
+  // CommonMark anchors nested content to the marker column, so an ordered item
+  // indented to only 2 columns would be re-parsed as a sibling/loose content on
+  // re-import. Callers therefore pass the exact indent width to use.
+  const indentItemChildren = (
+    childStrings: string[],
+    prefix: string,
+    indentWidth: number,
+  ): string => {
+    const pad = " ".repeat(indentWidth);
+    const out: string[] = [];
+    for (const child of childStrings) {
+      for (const row of child.split("\n")) {
+        if (out.length === 0) {
+          // Nothing emitted yet: first line of the first block gets the marker.
+          out.push(`${prefix} ${row}`);
+        } else if (row.length) {
+          out.push(pad + row); // continuation line, aligned under the marker
+        } else {
+          out.push(""); // keep blank lines blank (no trailing whitespace)
+        }
+      }
+    }
+    return out.join("\n");
+  };
+
+  const processListItem = (item: any, prefix: string): string => {
+    const rendered = (item.content || []).map(processNode);
+    // An item with no children is just its bare marker. Otherwise the marker
+    // as rendered is `${prefix} ` (prefix + one space), so the continuation
+    // indent is prefix.length + 1 — right for bullet ("-" -> 2) and ordered
+    // ("1." -> 3, "10." -> 4) markers, whose visible prefix IS the marker.
+    return rendered.length === 0
+      ? prefix
+      : indentItemChildren(rendered, prefix, prefix.length + 1);
+  };
+
+  const processTaskItem = (item: any): string => {
+    const prefix = item.attrs?.checked ? "- [x]" : "- [ ]";
+    const rendered = (item.content || []).map(processNode);
+    // An empty task item still needs its checkbox marker: indenting zero
+    // children would produce "" and the "- [ ]"/"- [x]" row would disappear.
+    if (!rendered.length) {
+      return prefix;
+    }
+    // The list marker of a task item is just "- " (2 columns); the
+    // "[ ] "/"[x] " checkbox is item content, NOT part of the marker. The
+    // continuation indent is therefore a fixed 2 — do NOT derive it from the
+    // wider prefix.length.
+    return indentItemChildren(rendered, prefix, 2);
+  };
+
+  return processNode(content).trim();
+}
diff --git a/packages/git-sync/src/lib/markdown-document.ts b/packages/prosemirror-markdown/src/lib/markdown-document.ts
similarity index 100%
rename from packages/git-sync/src/lib/markdown-document.ts
rename to packages/prosemirror-markdown/src/lib/markdown-document.ts
diff --git a/packages/prosemirror-markdown/src/lib/markdown-to-prosemirror.ts b/packages/prosemirror-markdown/src/lib/markdown-to-prosemirror.ts
new file mode 100644
index 00000000..b5e0f2d7
--- /dev/null
+++ b/packages/prosemirror-markdown/src/lib/markdown-to-prosemirror.ts
@@ -0,0 +1,1013 @@
+/**
+ * Pure markdown -> ProseMirror conversion.
+ *
+ * The converter path is `markdownToProseMirror` (marked -> HTML ->
+ * generateJSON) plus the two pre/post processors it needs (`preprocessCallouts`,
+ * `bridgeTaskLists`). The gitmost server writes the resulting page bodies
+ * natively through the collab gateway, so no websocket/Yjs write-path lives
+ * here.
+ */
+import { generateJSON } from "@tiptap/html";
+import { JSDOM } from "jsdom";
+import { Marked } from "marked";
+import type { TokenizerExtension, RendererExtension } from "marked";
+import { docmostExtensions } from "./docmost-schema.js";
+import { parseAttachedComment } from "./attached-comment.js";
+import { splitFootnoteParagraphs } from "./footnote.js";
+import {
+  decodeInlineMathLatex,
+  escapeMathAttr,
+  inlineMathAnchoredRe,
+} from "./math-inline.js";
+import {
+  attachmentToHtml,
+  audioToHtml,
+  diagramToHtml,
+  embedToHtml,
+  pageEmbedToHtml,
+  pdfToHtml,
+  transclusionReferenceToHtml,
+  videoToHtml,
+  youtubeToHtml,
+} from "./media-html.js";
+
+/**
+ * #293 canon #7: `==text==` (Obsidian/GFM highlight) inline syntax.
+ *
+ * `==` is NOT standard markdown, so we teach the parser to turn `==text==` into
+ * `<mark>text</mark>`, which the schema's Highlight extension parses back into a
+ * color-less `highlight` mark (see docmost-schema.ts). This mirrors the
+ * serializer's no-color highlight form, so a plain highlight round-trips.
+ *
+ * This is an INLINE extension (mid-line, must respect token precedence so it
+ * never fires inside an inline code span). The tokenizer requires a non-empty,
+ * non-space-leading inner and re-tokenizes it via `this.lexer.inlineTokens`,
+ * so nested marks (bold/italic/links inside a highlight) round-trip.
+ * The renderer re-parses the inner tokens and wraps them in `<mark>`.
+ *
+ * It is registered on a DEDICATED `Marked` instance owned by this module
+ * (below), NOT the global `marked` singleton, so the `==` behavior cannot leak
+ * into unrelated callers that import `marked` elsewhere in the monorepo.
+ */
+interface HighlightMarkToken {
+  type: "highlightMark"; // discriminator; same string as the extension `name`
+  raw: string; // full matched source, both `==` fences included
+  text: string; // inner source between the fences
+  tokens: any[]; // inline tokens lexed from `text`
+}
+
+const highlightMarkExtension: TokenizerExtension & RendererExtension = {
+  name: "highlightMark",
+  level: "inline",
+  // Report the offset of the next `==` so marked tries the tokenizer there.
+  start(src: string) {
+    const at = src.indexOf("==");
+    return at === -1 ? undefined : at;
+  },
+  tokenizer(src: string) {
+    // The inner must be non-empty and must not start with whitespace, and a
+    // closing `==` is required. Lazy `+?` takes the SHORTEST inner, so
+    // `==a== ==b==` is two marks; `====` and a lone `==x` stay literal text.
+    const found = /^==(?=\S)([\s\S]+?)==/.exec(src);
+    if (found === null) return undefined;
+    const [raw, text] = found;
+    // Lex the inner as inline markdown so nested marks round-trip.
+    const token: HighlightMarkToken = {
+      type: "highlightMark",
+      raw,
+      text,
+      tokens: this.lexer.inlineTokens(text),
+    };
+    return token as any;
+  },
+  renderer(token: any) {
+    return `<mark>${this.parser.parseInline(token.tokens)}</mark>`;
+  },
+};
+
+/**
+ * #293 canon #6: Obsidian-native math — `$LaTeX$` (inline) and `$$…$$` (block).
+ *
+ * INLINE `$…$` uses the SHARED pandoc currency-safe rule (math-inline.ts), the
+ * SAME rule the serializer's prose escaper uses, so currency (`$5`,
+ * `$5 and $10`) is NEVER math and a would-be-math prose `$x$` (escaped `\$x\$`
+ * on export) stays literal. The captured inner LaTeX is decoded (`\$`→`$`) and
+ * emitted as the schema's `span[data-type="mathInline"]` carrying the LaTeX in a
+ * `text="…"` attribute (the schema's default attribute parser reads it back).
+ *
+ * BLOCK `$$…$$` matches a `$$` fence on its own line(s), capturing multi-line
+ * LaTeX up to the next `$$` line, and emits `div[data-type="mathBlock"]`.
+ *
+ * Both fail OPEN: an unbalanced `$`/`$$`, or a currency `$`, returns undefined
+ * from the tokenizer and stays literal text with no crash. Registered on the
+ * SAME dedicated instance as the highlight extension (never the global marked
+ * singleton), so the `$`/`$$` behavior cannot leak into unrelated callers.
+ */
+const mathInlineExtension: TokenizerExtension & RendererExtension = {
+  name: "mathInline",
+  level: "inline",
+  start(src: string) {
+    const at = src.indexOf("$");
+    return at === -1 ? undefined : at;
+  },
+  tokenizer(src: string) {
+    // No match — currency or an unbalanced `$` — leaves the source as
+    // literal text.
+    const found = inlineMathAnchoredRe().exec(src);
+    if (found === null) return undefined;
+    const [raw, latex] = found;
+    return { type: "mathInline", raw, text: decodeInlineMathLatex(latex) } as any;
+  },
+  renderer(token: any) {
+    const latex = escapeMathAttr(token.text);
+    return `<span data-type="mathInline" data-katex="true" text="${latex}"></span>`;
+  },
+};
+
+const mathBlockExtension: TokenizerExtension & RendererExtension = {
+  name: "mathBlock",
+  level: "block",
+  start(src: string) {
+    // Offset of the first `$$` that begins a line; undefined when there is none.
+    const hit = /(?:^|\n)\$\$/.exec(src);
+    if (hit === null) return undefined;
+    return hit.index + hit[0].length - 2;
+  },
+  tokenizer(src: string) {
+    // An opening `$$` line, then the SHORTEST body up to the next line that
+    // holds only `$$` (lazy, so a later unrelated fence is never swallowed).
+    // The body may span lines; an empty body is `$$`, an empty line, `$$`.
+    const fence = /^\$\$[^\S\n]*\n([\s\S]*?)\n\$\$[^\S\n]*(?:\n|$)/;
+    const found = fence.exec(src);
+    if (found === null) return undefined; // no closing fence -> literal
+    const [raw, text] = found;
+    return { type: "mathBlock", raw, text } as any;
+  },
+  renderer(token: any) {
+    const latex = escapeMathAttr(token.text);
+    return `<div data-type="mathBlock" data-katex="true" text="${latex}"></div>`;
+  },
+};
+
+/**
+ * #293 canon #2: Pandoc/Obsidian inline footnotes — `^[note body]`.
+ *
+ * The single canonical markdown form carries the note body AT the reference
+ * point. The crux is the tokenizer: it BALANCES `[`/`]` (respecting
+ * backslash-escaped brackets) from the opening `^[` to its MATCHING `]`, so a
+ * body that itself contains a `[link](url)` is captured whole — a lazy
+ * `^\[([^\]]+)\]` would cut at the first inner `]` and fragment the parse.
+ *
+ * The renderer emits the schema's `<sup data-footnote-ref>` marker carrying the
+ * (still-encoded) body in a `data-fn-text` attribute and NO id. A later
+ * post-`marked` pass (assembleFootnotes) collects those sups, dedups by the EXACT
+ * body text, ASSIGNS sequential ids (fn-1, fn-2, … in first-seen order), and
+ * builds one doc-level `<div data-footnote-def>` per unique body inside a single
+ * `<section data-footnotes>`. Assigning ids from the exact text (rather than a
+ * hash) makes collisions between DIFFERENT bodies impossible (F1) while staying
+ * race-free — all ids are assigned inside that one call from the local DOM, no
+ * module state — and byte-stable (ids are never written to markdown; `^[body]`
+ * carries only text, so identical bodies still merge).
+ *
+ * Fail-open: an unbalanced `^[` with no matching `]` returns undefined from the
+ * tokenizer and stays literal text (no crash). `^[]` is a footnote with an empty
+ * body. The reference form `[^id]` / `[^id]: def` is NOT parsed (no `^[`), so it
+ * stays literal (an accepted hand-authoring gap; no backward compat). Registered
+ * on the SAME dedicated instance as the highlight/math extensions.
+ */
+const footnoteInlineExtension: TokenizerExtension & RendererExtension = {
+  name: "footnoteInline",
+  level: "inline",
+  // Report the offset of the next `^[` so marked tries the tokenizer there.
+  start(src: string) {
+    const at = src.indexOf("^[");
+    return at === -1 ? undefined : at;
+  },
+  tokenizer(src: string) {
+    // Only a source that begins with `^[` can be an inline footnote.
+    if (!src.startsWith("^[")) return undefined;
+    // Walk forward from just after `^[`, tracking bracket depth until the
+    // `]` that closes the opening `[`. A backslash skips the character after
+    // it (so `\[` / `\]` never change the depth), matching the serializer's
+    // balanceBrackets.
+    // `close` becomes the index of that matching `]`; it stays -1 when the
+    // brackets never balance.
+    let close = -1;
+    let depth = 1;
+    for (let pos = 2; pos < src.length; pos++) {
+      const ch = src[pos];
+      if (ch === "\\" && pos + 1 < src.length) {
+        pos++; // plus the loop increment: steps over the escaped character
+      } else if (ch === "[") {
+        depth++;
+      } else if (ch === "]" && --depth === 0) {
+        // Depth is back to zero: this `]` pairs with the opening `^[`.
+        close = pos;
+        break;
+      }
+    }
+    if (close === -1) return undefined; // unbalanced -> literal text (fail-open)
+    // `^[]` closes immediately and yields an empty `text` (empty-body note).
+    return {
+      type: "footnoteInline",
+      raw: src.slice(0, close + 1), // up to and including the closing `]`
+      text: src.slice(2, close), // between `^[` and the matching `]`
+    } as any;
+  },
+  renderer(token: any) {
+    // No id here (F1): assembleFootnotes assigns ids by dedup-ing the exact
+    // body, which rides (attribute-escaped) in data-fn-text.
+    const body = escapeFootnoteAttr(token.text);
+    return `<sup data-footnote-ref data-fn-text="${body}"></sup>`;
+  },
+};
+
+/**
+ * Escape a value placed in a double-quoted HTML attribute (footnote id /
+ * body). Only `&` and `"` are special in that context; escaping them keeps the
+ * attribute well-formed and is idempotent (jsdom decodes them back).
+ */
+function escapeFootnoteAttr(value: string): string {
+  return String(value).split("&").join("&amp;").split('"').join("&quot;");
+}
+
+// Dedicated marked instance: default (GFM) options plus the `==` highlight
+// inline extension, the `$…$` / `$$…$$` math extensions (#293 canon #6), and the
+// `^[…]` inline-footnote extension (#293 canon #2). Constructed once at module
+// load so the extensions are registered exactly once and never mutate the global
+// `marked` singleton.
+const markedInstance = new Marked().use({
+  extensions: [
+    highlightMarkExtension, // `==text==` -> <mark>
+    mathInlineExtension, // `$…$` -> span[data-type="mathInline"]
+    mathBlockExtension, // `$$…$$` fence -> div[data-type="mathBlock"]
+    footnoteInlineExtension, // `^[…]` -> sup[data-footnote-ref]
+  ],
+});
+
+// Import-time side effect: jsdom globals for Tiptap HTML parsing in Node.js.
+const dom = new JSDOM("<!DOCTYPE html><html><body></body></html>");
+global.window = dom.window as any;
+global.document = dom.window.document;
+// @ts-ignore
+global.Element = dom.window.Element;
+
+/**
+ * Hard ceiling above which we skip callout preprocessing entirely. The linear
+ * scanner below has no quadratic blow-up, but we still cap input defensively so
+ * a pathological multi-megabyte payload cannot tie up the event loop; in that
+ * case the markdown is passed through verbatim (callouts are simply not
+ * detected) rather than risking a slow scan.
+ *
+ * The callers in this file compare the limit against `String.length`, so it is
+ * effectively measured in UTF-16 code units rather than encoded bytes. The
+ * task-list bridge reuses the same ceiling for its HTML input.
+ */
+const MAX_CALLOUT_PREPROCESS_BYTES = 4 * 1024 * 1024; // 4 MB
+
+/**
+ * Matches an opening callout fence: `:::type`. Group 1 captures the type as
+ * written (one or more word characters); the caller lower-cases it. Nothing but
+ * optional whitespace may follow the type on the line.
+ */
+const CALLOUT_OPEN_RE = /^:::\s*(\w+)\s*$/;
+/** Matches a bare closing callout fence: `:::` (trailing whitespace allowed). */
+const CALLOUT_CLOSE_RE = /^:::\s*$/;
+/**
+ * Matches an Obsidian-native callout opener: `> [!type]` (type captured in
+ * group 1). The pattern is anchored only at the start of the line, so an
+ * optional title after the type is allowed but ignored (the Docmost callout
+ * schema has no title). The body is the following contiguous blockquote lines.
+ */
+const CALLOUT_BQ_OPEN_RE = /^>\s*\[!(\w+)\]/;
+/**
+ * Matches any blockquote continuation line (`>` … ). The `>` must be the very
+ * first character of the line; leading whitespace is not accepted.
+ */
+const BLOCKQUOTE_LINE_RE = /^>/;
+/**
+ * Matches the start/end of a code fence (``` or ~~~). Group 1 is the leading
+ * whitespace and group 2 the marker run (three or more backticks or tildes);
+ * callers read group 2. Only the start of the line is anchored, so any text
+ * after the marker (e.g. an info string) still matches.
+ */
+const CODE_FENCE_RE = /^(\s*)(`{3,}|~{3,})/;
+
+/**
+ * Pre-process Docmost-flavoured markdown: convert `:::type ... :::` callout
+ * blocks (the syntax our markdown export produces) and Obsidian-native
+ * `> [!type]` callouts into HTML divs that the callout extension parses. The
+ * inner content is rendered through marked as regular markdown.
+ *
+ * Implemented as a single linear pass over the lines (no quadratic regex
+ * rescan). It:
+ *   - tracks fenced code regions (```...``` and ~~~...~~~) and never treats a
+ *     `:::` line that lives inside a code fence as a callout delimiter. Fence
+ *     detection follows CommonMark: a backtick fence OPENER may not carry a
+ *     backtick later on the same line (that is an inline code span), and a
+ *     CLOSING fence may be followed by whitespace only, so a "```js" line inside
+ *     an open fence is content, not a closer;
+ *   - matches an opening `:::type` line with the next CLOSING `:::` at the SAME
+ *     nesting level, supporting NESTED callouts via a depth counter (an inner
+ *     `:::type` opens a deeper level and consumes a matching `:::`);
+ *   - treats `> [!type]` as a callout opener ONLY when it is the FIRST line of
+ *     its blockquote; a `[!type]` line in the middle of an ordinary blockquote
+ *     stays part of that blockquote;
+ *   - emits `<div data-type="callout" data-callout-type="TYPE">` with the inner
+ *     markdown rendered through marked.
+ *
+ * @param markdown Raw markdown source.
+ * @returns The markdown with every recognized callout replaced by its HTML
+ *   div; input longer than MAX_CALLOUT_PREPROCESS_BYTES is returned verbatim.
+ */
+async function preprocessCallouts(markdown: string): Promise<string> {
+  // Defensive cap: skip preprocessing for pathologically large inputs.
+  if (markdown.length > MAX_CALLOUT_PREPROCESS_BYTES) {
+    return markdown;
+  }
+
+  // Return the fence marker when `line` OPENS a fenced code block, else null.
+  // A backtick fence whose remainder contains another backtick is an inline
+  // code span (CommonMark), not a fence, so it must not swallow later lines.
+  const fenceOpener = (line: string): string | null => {
+    const m = line.match(CODE_FENCE_RE);
+    if (!m) return null;
+    if (m[2][0] === "`" && line.slice(m[0].length).includes("`")) return null;
+    return m[2];
+  };
+
+  // True when `line` CLOSES the fence opened with `marker`: same fence
+  // character, at least as long, and nothing but whitespace after it (a line
+  // with an info string can only open a fence, never close one).
+  const closesFence = (line: string, marker: string): boolean => {
+    const m = line.match(CODE_FENCE_RE);
+    return (
+      m !== null &&
+      m[2][0] === marker[0] &&
+      m[2].length >= marker.length &&
+      line.slice(m[0].length).trim() === ""
+    );
+  };
+
+  // Render one callout: recurse into the body first (so nested callouts are
+  // converted), render the result through marked, and wrap it in the div.
+  async function renderCallout(
+    type: string,
+    bodyLines: string[],
+  ): Promise<string> {
+    const inner = await transform(bodyLines);
+    const renderedInner = await markedInstance.parse(inner);
+    return `\n<div data-type="callout" data-callout-type="${type}">${renderedInner}</div>\n`;
+  }
+
+  // Transform a slice of lines, converting the top-level callouts in that
+  // slice into <div> blocks; everything else is copied through unchanged.
+  async function transform(lines: string[]): Promise<string> {
+    const out: string[] = [];
+    let fenceMarker: string | null = null; // marker of the open fence, if any
+    let i = 0;
+
+    while (i < lines.length) {
+      const line = lines[i];
+
+      // Inside a code fence, only its matching closing fence is significant;
+      // everything else (including `:::` lines) is copied through verbatim.
+      if (fenceMarker !== null) {
+        out.push(line);
+        if (closesFence(line, fenceMarker)) fenceMarker = null;
+        i++;
+        continue;
+      }
+
+      // A code fence opening outside any callout body: enter code-fence mode.
+      const opened = fenceOpener(line);
+      if (opened !== null) {
+        fenceMarker = opened;
+        out.push(line);
+        i++;
+        continue;
+      }
+
+      // An opening callout fence: scan forward (with code-fence and nested
+      // callout awareness) for its matching closing `:::` at the same level.
+      const open = line.match(CALLOUT_OPEN_RE);
+      if (open) {
+        const bodyLines: string[] = [];
+        let depth = 1;
+        let innerFence: string | null = null;
+        let j = i + 1;
+        for (; j < lines.length; j++) {
+          const bl = lines[j];
+          if (innerFence !== null) {
+            if (closesFence(bl, innerFence)) innerFence = null;
+          } else {
+            const f = fenceOpener(bl);
+            if (f !== null) {
+              innerFence = f;
+            } else if (CALLOUT_OPEN_RE.test(bl)) {
+              depth++;
+            } else if (CALLOUT_CLOSE_RE.test(bl)) {
+              depth--;
+              if (depth === 0) break; // matching close for THIS callout
+            }
+          }
+          bodyLines.push(bl);
+        }
+
+        if (j < lines.length) {
+          // Found the matching closing fence: emit the callout div and skip
+          // past the closing `:::`.
+          out.push(await renderCallout(open[1].toLowerCase(), bodyLines));
+          i = j + 1;
+          continue;
+        }
+        // No matching close (unterminated callout): treat the opener as a
+        // literal line and continue, preserving the original text.
+        out.push(line);
+        i++;
+        continue;
+      }
+
+      // An Obsidian-native callout: `> [!type]` opener; the body is the
+      // following CONTIGUOUS blockquote (`>`-prefixed) lines. Strip ONE
+      // blockquote level and recurse so nested callouts (`> > [!type]`) are
+      // handled, then emit the same callout div the `:::` path produces.
+      // The opener only counts on the FIRST line of a blockquote: when the
+      // previous line is itself a `>` line it was emitted as ordinary
+      // blockquote text (a callout consumes all of its contiguous `>` lines),
+      // so this line continues that blockquote and must stay part of it.
+      const bqOpen = line.match(CALLOUT_BQ_OPEN_RE);
+      const continuesQuote = i > 0 && BLOCKQUOTE_LINE_RE.test(lines[i - 1]);
+      if (bqOpen && !continuesQuote) {
+        const bodyLines: string[] = [];
+        let j = i + 1;
+        for (; j < lines.length; j++) {
+          if (!BLOCKQUOTE_LINE_RE.test(lines[j])) break;
+          bodyLines.push(lines[j].replace(/^>\s?/, ""));
+        }
+        out.push(await renderCallout(bqOpen[1].toLowerCase(), bodyLines));
+        i = j;
+        continue;
+      }
+
+      out.push(line);
+      i++;
+    }
+
+    return out.join("\n");
+  }
+
+  return transform(markdown.split("\n"));
+}
+
+/**
+ * Rewrite marked's checkbox lists into the markup TipTap task lists parse.
+ *
+ * marked renders a GitHub task item (`- [x] done`) as an ordinary
+ * `<ul><li><p><input type="checkbox" checked> text</p></li></ul>`, which the
+ * TaskList/TaskItem extensions do not recognize. They expect
+ * `ul[data-type="taskList"]` holding `li[data-type="taskItem"]` items whose
+ * state is `data-checked="true"|"false"`, so qualifying lists are reshaped to
+ * exactly that.
+ *
+ * Qualification: the list (`<ul>` or `<ol>`) has at least one direct `<li>` and
+ * EVERY direct `<li>` owns a checkbox. A numbered checklist (`1. [x] a`) arrives
+ * as an `<ol>`; because task lists are unordered it is re-created as a `<ul>`.
+ * Mixed and ordinary lists are left alone. The `<p>` wrapper marked emits is
+ * kept, since TaskItem content allows paragraphs.
+ *
+ * @param html Post-`marked` HTML.
+ * @returns The HTML with qualifying lists bridged; the input itself when it
+ *   holds no checkbox or exceeds MAX_CALLOUT_PREPROCESS_BYTES.
+ */
+function bridgeTaskLists(html: string): string {
+  // Two pass-through cases, both returning the markup verbatim: no checkbox
+  // at all (the common case, so the JSDOM parse is skipped), or a payload so
+  // large that a second expensive DOM parse is not worth risking.
+  const mentionsCheckbox = /type=["']?checkbox/i.test(html);
+  if (!mentionsCheckbox || html.length > MAX_CALLOUT_PREPROCESS_BYTES) {
+    return html;
+  }
+
+  const { document } = new JSDOM(html).window;
+
+  // Checkboxes that belong to an <li> itself: direct <input type="checkbox">
+  // children plus those sitting directly inside one of its direct <p> children
+  // (marked's shape). Anything deeper — e.g. inside a nested sublist — is not
+  // counted, so a bullet item that merely contains a task sublist does not
+  // qualify. Raw inline HTML may yield several per item; all are returned.
+  const ownCheckboxes = (li: Element): Element[] => {
+    const boxes: Element[] = [];
+    for (const node of Array.from(li.children)) {
+      const isDirectBox =
+        node.tagName === "INPUT" && node.getAttribute("type") === "checkbox";
+      if (isDirectBox) {
+        boxes.push(node);
+      } else if (node.tagName === "P") {
+        boxes.push(
+          ...Array.from(
+            node.querySelectorAll(":scope > input[type='checkbox']"),
+          ),
+        );
+      }
+    }
+    return boxes;
+  };
+
+  // Snapshot the candidate lists up front; nested lists are separate entries
+  // and get their own turn, so each iteration looks at DIRECT <li>s only.
+  for (const list of Array.from(document.querySelectorAll("ul, ol"))) {
+    const items = Array.from(list.children).filter(
+      (node) => node.tagName === "LI",
+    );
+    if (items.length === 0) continue;
+
+    const boxesPerItem = items.map((li) => ownCheckboxes(li));
+    // A single item without its own checkbox disqualifies the whole list.
+    if (boxesPerItem.some((boxes) => boxes.length === 0)) continue;
+
+    // An <ol> must not simply be tagged data-type="taskList": generateJSON
+    // would match both the orderedList rule (tag) and the taskList rule
+    // (data-type) and emit a phantom empty orderedList. Swap it for a <ul>
+    // carrying the same attributes and child nodes instead.
+    let taskList: Element = list;
+    if (list.tagName === "OL") {
+      taskList = document.createElement("ul");
+      for (const { name, value } of Array.from(list.attributes)) {
+        taskList.setAttribute(name, value);
+      }
+      while (list.firstChild) {
+        taskList.appendChild(list.firstChild);
+      }
+      list.replaceWith(taskList);
+    }
+    taskList.setAttribute("data-type", "taskList");
+
+    for (let k = 0; k < items.length; k++) {
+      const li = items[k];
+      const boxes = boxesPerItem[k];
+      // The first checkbox decides the state; any others are only removed.
+      const first = boxes[0] ?? null;
+      li.setAttribute("data-type", "taskItem");
+      const isChecked =
+        first != null &&
+        (first.hasAttribute("checked") || (first as any).checked);
+      li.setAttribute("data-checked", isChecked ? "true" : "false");
+      // Strip every own checkbox so none survives into the item content.
+      boxes.forEach((box) => box.remove());
+    }
+  }
+
+  return document.body.innerHTML;
+}
+
+/**
+ * Materialize serializer-emitted HTML comments (#293 canon) as schema markup
+ * before the DOM/generateJSON stage drops them.
+ *
+ * Attributes with no native markdown syntax are serialized as
+ * `<!--name {json}-->` comments (see attached-comment.ts). `marked` keeps them
+ * as comment NODES, but the next stage (parse5/jsdom via generateJSON) discards
+ * comment nodes, so the data would be lost. This pass runs on the post-`marked`
+ * HTML, re-expresses each recognized comment in a form the schema's parseHTML
+ * already understands, and removes the comment so it cannot leak.
+ *
+ * The comment NAME together with its POSITION selects the handling:
+ *
+ *   - `subpages` / `pagebreak` (#5) and `pageembed` / `transclusion` (#8):
+ *     STANDALONE only — a lone comment line, which ends up directly under
+ *     `<body>` or, when it leads the output, at document level. Replaced by the
+ *     matching block element (`<div data-type="pageBreak">`,
+ *     `<div data-type="subpages" [data-recursive]>`, or the element built by
+ *     pageEmbedToHtml / transclusionReferenceToHtml).
+ *   - `youtube` / `video` / `audio` / `drawio` / `excalidraw` (#8 IMAGE-FORM):
+ *     the previous element sibling must be an `<img>`; it is replaced by the
+ *     element built from the img's `src` plus the decoded attrs.
+ *   - `pdf` / `attachment` / `embed` (#8 LINK-FORM): the previous element
+ *     sibling must be an `<a>`; it is replaced by the element built from the
+ *     anchor's `href`, its text and the decoded attrs.
+ *   - `img` (#4): the previous element sibling must be an `<img>`; each decoded
+ *     key is written onto it as the DOM attribute the image schema reads back
+ *     (align/width/height/data-size/data-aspect-ratio/data-attachment-id/
+ *     data-caption/title).
+ *   - `attrs` (#9): ATTACHED only — the comment's parent must be a `<p>`/`<hN>`.
+ *     The only handled key is `textAlign`, written as an inline `text-align`
+ *     style on the parent.
+ *
+ * A bare `![](url)` / `[text](src)` with no following discriminator comment is
+ * never touched (no URL sniffing). Fail-open everywhere: a malformed comment
+ * (null from parseAttachedComment), an unknown name, or a comment in the wrong
+ * position / next to the wrong element is left INERT for generateJSON to drop.
+ *
+ * @param html Post-`marked` HTML.
+ * @returns The body HTML with directives applied; the input itself when it
+ *   contains no comment at all.
+ */
+function applyCommentDirectives(html: string): string {
+  // Fast path: without a comment opener there is nothing to intercept.
+  if (!html.includes("<!--")) return html;
+
+  const jsdom = new JSDOM(html);
+  const document = jsdom.window.document;
+
+  // Snapshot every comment in the WHOLE document (not just <body>): a comment
+  // that leads the output is placed by the HTML parser at document level,
+  // outside `document.body`, and would otherwise be missed.
+  const walker = document.createTreeWalker(
+    document,
+    jsdom.window.NodeFilter.SHOW_COMMENT,
+  );
+  const comments: any[] = [];
+  for (let node: any = walker.nextNode(); node; node = walker.nextNode()) {
+    comments.push(node);
+  }
+
+  // Elements built from document-level (leading) standalone comments. They
+  // are moved into <body> at the end, in document order, because the result
+  // is `document.body.innerHTML`.
+  const leading: any[] = [];
+
+  // #293 canon #8: discriminator NAME -> node form. The markup is rebuilt with
+  // the same builders the serializer's raw-HTML path uses (media-html.ts), so
+  // serialize and parse cannot drift.
+  const IMAGE_FORM_NAMES = new Set([
+    "youtube",
+    "video",
+    "audio",
+    "drawio",
+    "excalidraw",
+  ]);
+  const LINK_FORM_NAMES = new Set(["pdf", "attachment", "embed"]);
+
+  // Destination attribute for each `img` comment key copied when present,
+  // listed in the order the attributes are written.
+  const IMG_ATTRIBUTE_FOR_KEY: Array<[string, string]> = [
+    ["width", "width"],
+    ["height", "height"],
+    ["size", "data-size"],
+    ["aspectRatio", "data-aspect-ratio"],
+    ["attachmentId", "data-attachment-id"],
+    ["caption", "data-caption"],
+    ["title", "title"],
+  ];
+
+  // Parse a schema-HTML string into its top-level element.
+  const toElement = (markup: string): any => {
+    const holder = document.createElement("div");
+    holder.innerHTML = markup;
+    return holder.firstElementChild;
+  };
+
+  // STANDALONE position: directly under <body>, or at document level / under
+  // <html> (no element parent yields the empty tag).
+  const isStandalone = (tag: string): boolean =>
+    tag === "" || tag === "body" || tag === "html";
+
+  // Swap a standalone comment for `el`: in place when it sits in <body> (so
+  // the surrounding order is kept), otherwise drop it and queue `el`.
+  const placeStandalone = (comment: any, tag: string, el: any): void => {
+    if (tag === "body") {
+      comment.replaceWith(el);
+      return;
+    }
+    comment.remove();
+    leading.push(el);
+  };
+
+  // The comment's previous element sibling when it is a `<wanted>` element,
+  // else null (which leaves the comment inert).
+  const precedingElement = (comment: any, wanted: string): any => {
+    const prev = comment.previousElementSibling as any;
+    const isWanted =
+      prev && String(prev.tagName || "").toLowerCase() === wanted;
+    return isWanted ? prev : null;
+  };
+
+  // Schema HTML for an image-form discriminator.
+  const imageFormMarkup = (
+    name: string,
+    attrs: Record<string, any>,
+  ): string => {
+    if (name === "video") return videoToHtml(attrs);
+    if (name === "audio") return audioToHtml(attrs);
+    if (name === "youtube") return youtubeToHtml(attrs);
+    // Remaining image-form names: drawio | excalidraw.
+    return diagramToHtml(name as "drawio" | "excalidraw", attrs);
+  };
+
+  for (const comment of comments) {
+    const directive = parseAttachedComment(comment.data);
+    if (!directive) continue; // malformed -> inert (dropped by generateJSON)
+    const name = directive.name;
+    const parent = comment.parentElement as any;
+    const tag = String(parent?.tagName || "").toLowerCase();
+
+    // #5 STANDALONE machinery: page break / subpages block.
+    if (name === "subpages" || name === "pagebreak") {
+      if (!isStandalone(tag)) continue; // attached position -> inert
+      const block = document.createElement("div");
+      if (name === "pagebreak") {
+        block.setAttribute("data-type", "pageBreak");
+      } else {
+        block.setAttribute("data-type", "subpages");
+        if (directive.attrs.recursive === true) {
+          block.setAttribute("data-recursive", "true");
+        }
+      }
+      placeStandalone(comment, tag, block);
+      continue;
+    }
+
+    // #8 STANDALONE media: page embed / transclusion reference.
+    if (name === "pageembed" || name === "transclusion") {
+      if (!isStandalone(tag)) continue; // attached position -> inert
+      const markup =
+        name === "pageembed"
+          ? pageEmbedToHtml({ sourcePageId: directive.attrs.sourcePageId })
+          : transclusionReferenceToHtml({
+              sourcePageId: directive.attrs.sourcePageId,
+              transclusionId: directive.attrs.transclusionId,
+            });
+      const built = toElement(markup);
+      if (!built) continue; // defensive: builder always yields an element
+      placeStandalone(comment, tag, built);
+      continue;
+    }
+
+    // #8 IMAGE-FORM media: `![](src)<!--name {…}-->`. The node src comes from
+    // the <img>; it overrides any `src` key carried by the comment.
+    if (IMAGE_FORM_NAMES.has(name)) {
+      const img = precedingElement(comment, "img");
+      if (!img) continue; // no adjacent <img> -> inert
+      const attrs = { ...directive.attrs, src: img.getAttribute("src") || "" };
+      const built = toElement(imageFormMarkup(name, attrs));
+      if (!built) continue;
+      img.replaceWith(built);
+      comment.remove();
+      continue;
+    }
+
+    // #8 LINK-FORM media: `[text](src)<!--name {…}-->`. src = the anchor's
+    // href; the visible text is the filename (pdf/attachment) or provider.
+    if (LINK_FORM_NAMES.has(name)) {
+      const anchor = precedingElement(comment, "a");
+      if (!anchor) continue; // no adjacent <a> -> inert
+      const src = anchor.getAttribute("href") || "";
+      const text = anchor.textContent || "";
+      let markup: string;
+      switch (name) {
+        case "pdf":
+          // Filename goes to `name` (null when the link text is empty).
+          markup = pdfToHtml({ ...directive.attrs, src, name: text || null });
+          break;
+        case "attachment":
+          // The schema field is `url` rather than `src`.
+          markup = attachmentToHtml({
+            ...directive.attrs,
+            url: src,
+            name: text || null,
+          });
+          break;
+        default:
+          // embed: the visible text is the provider (may be empty).
+          markup = embedToHtml({ ...directive.attrs, src, provider: text });
+      }
+      const built = toElement(markup);
+      if (!built) continue;
+      anchor.replaceWith(built);
+      comment.remove();
+      continue;
+    }
+
+    // #4 ATTACHED image attrs: `![](src) <!--img {…}-->`.
+    if (name === "img") {
+      const img = precedingElement(comment, "img");
+      if (!img) continue; // no adjacent <img> -> inert
+      const decoded = directive.attrs;
+      // `align` must be a non-empty string; the other keys are copied
+      // (stringified) whenever present. Unknown keys are ignored.
+      if (typeof decoded.align === "string" && decoded.align) {
+        img.setAttribute("align", decoded.align);
+      }
+      for (const [key, attribute] of IMG_ATTRIBUTE_FOR_KEY) {
+        if (decoded[key] != null) {
+          img.setAttribute(attribute, String(decoded[key]));
+        }
+      }
+      comment.remove();
+      continue;
+    }
+
+    // #9 ATTACHED attrs: needs an element parent that is a <p>/<hN>; any other
+    // name reaching this point is unknown and stays inert.
+    if (!parent || name !== "attrs") continue;
+    const isTextBlock = tag === "p" || /^h[1-6]$/.test(tag);
+    if (!isTextBlock) continue; // misplaced comment -> inert
+    const align = directive.attrs.textAlign;
+    if (typeof align === "string" && align) {
+      // The schema's textAlign parseHTML reads `el.style.textAlign` back onto
+      // the paragraph/heading node.
+      parent.style.textAlign = align;
+    }
+    // Consume the marker even when no key was recognized, so an attached
+    // comment never survives into the parsed body.
+    comment.remove();
+  }
+
+  // Move the queued leading elements to the front of <body>, in the order they
+  // were collected and ahead of the content that was already there.
+  const firstExisting = document.body.firstChild;
+  for (const el of leading) {
+    document.body.insertBefore(el, firstExisting);
+  }
+  return document.body.innerHTML;
+}
+
+// Hard cap on fixed-point rounds. Each round peels ONE nesting level, so this is
+// far above any realistic footnote nesting; it exists only so an adversarial
+// input can never spin unbounded. On hitting it we stop (leftover deeply-nested
+// sups stay inert) rather than hang.
+const MAX_FOOTNOTE_ROUNDS = 10000;
+
+/**
+ * #293 canon #2: assemble the doc-level footnote list from the `<sup>` markers.
+ *
+ * The `^[…]` inline extension (and the raw-HTML column path) leave every
+ * footnote reference as `<sup data-footnote-ref data-fn-text>`, carrying the
+ * (encoded) note body ON the marker but NO id. This post-`marked` pass — a
+ * sibling of applyCommentDirectives, run before generateJSON — turns those into
+ * the schema's three-node model:
+ *
+ *   - collect every `<sup data-footnote-ref>` that carries a `data-fn-text`;
+ *   - DEDUP by the EXACT body text (first-seen order) and assign SEQUENTIAL ids
+ *     `fn-1`, `fn-2`, …; set `data-id` on each sup (matched by its body). This is
+ *     the F1 fix: distinct bodies get distinct ids, so DIFFERENT notes can never
+ *     merge, while identical bodies still key to the same entry and MERGE;
+ *   - build one `<div data-footnote-def data-id>` per unique body — the body is
+ *     split into paragraphs by splitFootnoteParagraphs, each parsed as INLINE
+ *     markdown so links/marks in the note round-trip;
+ *   - append those defs into a single doc-level `<section data-footnotes>` at the
+ *     END of `<body>` — reusing an existing one if the HTML already has a
+ *     footnotes section (F4: never emit a duplicate `<section>`);
+ *   - STRIP `data-fn-text` from every sup, leaving `<sup data-footnote-ref
+ *     data-id>` for the schema's FootnoteReference parseHTML.
+ *
+ * NESTED footnotes (N1): a body can itself contain a `^[…]`, so `parseInline`
+ * of a def body can SPAWN a new inner `<sup data-fn-text>` INSIDE the just-built
+ * definition. The pass therefore runs to a FIXED POINT: every round re-scans
+ * for sups that still carry `data-fn-text` and processes them with the SAME
+ * dedup map, so an inner body identical to another still merges. The round cap
+ * bounds pathological input (fail-open: leftover sups stay inert).
+ *
+ * Id seeding (N2): generated ids continue after the highest pre-existing
+ * `fn-<N>` in the document. Pre-existing ids come from untrusted markup, so
+ * only values small enough that the counter stays exactly representable are
+ * used as a seed, and an id already present in the document is never handed
+ * out again. Without this, a pre-existing `fn-<huge number>` would push the
+ * counter past 2^53, where `++counter` no longer changes the value and every
+ * new body would receive the SAME id.
+ *
+ * Race-free by construction: ids are assigned inside this one call from the
+ * local DOM. Fail-open: a sup without `data-fn-text` (e.g. a legacy
+ * `<sup data-footnote-ref data-id>`) is left untouched.
+ *
+ * @param html Post-`marked` HTML.
+ * @returns The body HTML with ids assigned and definitions appended; the input
+ *   itself when no sup carries a footnote body.
+ */
+function assembleFootnotes(html: string): string {
+  // Cheap early-out: nothing carries a footnote body -> nothing to assemble.
+  if (!html.includes("data-fn-text")) return html;
+  const dom = new JSDOM(html);
+  const document = dom.window.document;
+  if (document.querySelector("sup[data-footnote-ref][data-fn-text]") == null) {
+    return html;
+  }
+
+  // F4: reuse an existing footnotes section if the HTML already has one so we
+  // never emit a duplicate. Otherwise create one at the END of <body>.
+  let section = document.querySelector("section[data-footnotes]");
+  if (!section) {
+    section = document.createElement("section");
+    section.setAttribute("data-footnotes", "");
+    // Attach it NOW, BEFORE the fixed-point loop: a def body's `parseInline`
+    // may spawn a nested `<sup data-fn-text>`, and the re-scan below queries
+    // the document, which only sees ATTACHED nodes (N1).
+    document.body.appendChild(section);
+  }
+
+  // N2: seed the sequential id counter PAST the highest `fn-<N>` id already
+  // present anywhere in the document. Only seeds up to half of
+  // MAX_SAFE_INTEGER are honored, which keeps every later `++counter` an exact
+  // integer; larger (or Infinity-parsing) values are ignored as seeds but still
+  // recorded in `existingIds`, so they can never be generated again either.
+  const MAX_SEED_ID = Math.floor(Number.MAX_SAFE_INTEGER / 2);
+  const existingIds = new Set<string>();
+  let counter = 0;
+  for (const el of Array.from(document.querySelectorAll("[data-id]"))) {
+    const existing = el.getAttribute("data-id") || "";
+    existingIds.add(existing);
+    const m = /^fn-(\d+)$/.exec(existing);
+    if (!m) continue;
+    const n = parseInt(m[1], 10);
+    if (n <= MAX_SEED_ID) counter = Math.max(counter, n);
+  }
+
+  // Dedup by the EXACT body text (first-seen order) -> sequential id. Keyed on
+  // the string itself, so two DIFFERENT bodies can NEVER share an id (F1). The
+  // map persists ACROSS rounds so a nested inner body that equals an outer/other
+  // body merges to the same def (N1).
+  const idByBody = new Map<string, string>(); // exact body -> assigned id
+
+  for (let round = 0; round < MAX_FOOTNOTE_ROUNDS; round++) {
+    const pending = Array.from(
+      document.querySelectorAll("sup[data-footnote-ref][data-fn-text]"),
+    );
+    if (pending.length === 0) break;
+    for (const sup of pending) {
+      const body = sup.getAttribute("data-fn-text") || "";
+      let id = idByBody.get(body);
+      const isNew = id === undefined;
+      if (id === undefined) {
+        // Next sequential id that is not already taken by pre-existing markup.
+        do {
+          id = `fn-${++counter}`;
+        } while (existingIds.has(id));
+        idByBody.set(body, id);
+      }
+      // Pin the id on the sup so the reference matches its definition, and strip
+      // the transient body attribute so it never re-matches / reaches generateJSON.
+      sup.setAttribute("data-id", id);
+      sup.removeAttribute("data-fn-text");
+      if (!isNew) continue; // this body already has its definition
+      // Build the definition. `parseInline` may inject a NEW inner
+      // `<sup data-fn-text>` into this def body — that is caught on the next
+      // round's re-scan (the fixed-point loop).
+      const def = document.createElement("div");
+      def.setAttribute("data-footnote-def", "");
+      def.setAttribute("data-id", id);
+      // Split the encoded body into paragraph markdown strings, then parse each
+      // inline so links/marks survive (the schema's footnoteDefinition requires
+      // `paragraph+`).
+      for (const paraMd of splitFootnoteParagraphs(body)) {
+        const p = document.createElement("p");
+        p.innerHTML = markedInstance.parseInline(paraMd) as string;
+        def.appendChild(p);
+      }
+      section.appendChild(def);
+    }
+  }
+
+  return document.body.innerHTML;
+}
+
+/**
+ * Recursively strip content-less paragraph nodes from a generated doc.
+ *
+ * A block-level atom whose markdown form is INLINE (e.g. the block `image`'s
+ * `![](url)`, or a bare media element) is wrapped by marked in a <p>; the schema
+ * then HOISTS the block atom out of that paragraph, leaving an EMPTY paragraph
+ * sibling. On the next export that empty `<p>` renders to "" and the doc "\n\n"
+ * join injects a phantom blank gap, so the markdown is not byte-stable.
+ *
+ * Markdown blank lines are separators, never content, so generateJSON only ever
+ * produces an empty paragraph as such a hoist artifact — removing them is safe
+ * and general (it also subsumes the <div>-wrapper workaround the `video` case
+ * uses). We remove ONLY `type === 'paragraph'` nodes whose `content` is absent
+ * or an empty array; every other node (including atoms without `content`) is
+ * preserved, and we recurse into the content of any node that has children.
+ */
+function stripEmptyParagraphs(node: any): any {
+  // Leaves and atoms carry no `content` array, so there is nothing to prune.
+  if (!node || !Array.isArray(node.content)) return node;
+
+  // Clean every child first (depth-first); `kept` then collects all of them
+  // except paragraphs whose own `content` is missing or zero-length.
+  const all: any[] = [];
+  const kept: any[] = [];
+  for (const rawChild of node.content) {
+    const child = stripEmptyParagraphs(rawChild);
+    all.push(child);
+    const inner = child ? child.content : undefined;
+    const populated = Array.isArray(inner) && inner.length > 0;
+    if (!child || child.type !== "paragraph" || populated) kept.push(child);
+  }
+  // Schema-validity guard: `block+` containers (tableCell, tableHeader,
+  // blockquote, column, callout, the doc root) must never end up as `[]`. If
+  // pruning removed every child, put the first (empty) paragraph back.
+  if (kept.length === 0 && all.length > 0) kept.push(all[0]);
+  return { ...node, content: kept };
+}
+
+/**
+ * Convert markdown to a ProseMirror doc using the full Docmost schema.
+ * Stages: callouts -> marked HTML -> comment directives -> footnotes ->
+ * task-list bridging -> generateJSON -> empty-paragraph cleanup.
+ */
+export async function markdownToProseMirror(
+  markdownContent: string,
+): Promise<any> {
+  const calloutMd = await preprocessCallouts(markdownContent);
+  const rawHtml = await markedInstance.parse(calloutMd);
+  // #293 #9 (attached textAlign) / #5 (standalone subpages, pageBreak): comment
+  // directives are materialized first, because generateJSON drops comments.
+  const directed = applyCommentDirectives(rawHtml);
+  // #293 canon #2: `<sup data-fn-text>` markers (`^[…]` or the raw-HTML column
+  // form) become the doc-level footnote list before the schema parse.
+  const prepared = bridgeTaskLists(assembleFootnotes(directed));
+  return stripEmptyParagraphs(generateJSON(prepared, docmostExtensions));
+}
diff --git a/packages/prosemirror-markdown/src/lib/math-inline.ts b/packages/prosemirror-markdown/src/lib/math-inline.ts
new file mode 100644
index 00000000..4deb3621
--- /dev/null
+++ b/packages/prosemirror-markdown/src/lib/math-inline.ts
@@ -0,0 +1,78 @@
+/**
+ * Shared inline-math boundary rule (#293 canon #6).
+ *
+ * Pandoc's inline-math rule lives here because it is used in TWO directions that
+ * MUST agree byte-for-byte on which `$…$` spans are math:
+ *
+ *   - the IMPORT tokenizer (markdown-to-prosemirror.ts) that turns `$LaTeX$`
+ *     into a `mathInline` node, and
+ *   - the EXPORT escaper (markdown-converter.ts) that backslash-escapes a
+ *     would-be-math `$…$` span sitting in PROSE text so it re-imports as literal
+ *     text instead of silently materializing a phantom math node.
+ *
+ * Defining the rule ONCE guarantees the two directions never drift: a span the
+ * tokenizer would match is EXACTLY a span the escaper neutralizes, so a prose
+ * `$x$` round-trips as literal text and math `$x^2$` round-trips as math.
+ *
+ * The rule (currency-safe, from pandoc): an opening `$` is NOT followed by
+ * whitespace; the closing `$` is NOT preceded by whitespace AND NOT immediately
+ * followed by a digit; the inner run is non-empty, single-line, and may embed an
+ * escaped `\$` (which never counts as the closer). Under this rule `$5`,
+ * `$5 and $10`, `price is $5`, `a $5 b $6 c` all stay literal (no VALID closing
+ * `$` exists — the `$` before a space-preceded amount fails the "not preceded by
+ * whitespace" test, and a lone `$` has no closer), while `$x^2$` is math.
+ */
+
+// Core pattern (unanchored), piece by piece in REGEX form (the string literal
+// below doubles every backslash):
+//   \$         -> opening `$`
+//   (?!\s)     -> opening `$` NOT followed by whitespace
+//   (?:\\\$|(?!\\\$)[^$\n])+?  -> inner: shortest NON-EMPTY run of either an
+//                 escaped `\$` (consumed as a unit) or one char that is neither
+//                 `$` nor newline and does NOT start a `\$` — so backtracking
+//                 can never split a `\$` and reuse its `$` as the closer
+//   (?<!\s)\$  -> closing `$`, whose preceding char is NOT whitespace
+//   (?![0-9])  -> closing `$` NOT immediately followed by a digit (currency)
+export const INLINE_MATH_SOURCE =
+  "\\$(?!\\s)((?:\\\\\\$|(?!\\\\\\$)[^$\\n])+?)(?<!\\s)\\$(?![0-9])";
+
+/** Global (`g`) matcher for the export-side prose escaper; new RegExp per call. */
+export const inlineMathGlobalRe = (): RegExp =>
+  new RegExp(INLINE_MATH_SOURCE, "g");
+
+/** Start-anchored (`^`) matcher for the import-side marked tokenizer. */
+export const inlineMathAnchoredRe = (): RegExp =>
+  new RegExp(`^${INLINE_MATH_SOURCE}`);
+
+/** Decode a tokenizer-captured inner LaTeX: every escaped `\$` becomes `$`. */
+export const decodeInlineMathLatex = (inner: string): string =>
+  inner.split("\\$").join("$");
+
+/** Escape every `$` as `\$` so LaTeX inside `$…$` cannot close early. */
+export const encodeInlineMathLatex = (latex: string): string =>
+  latex.split("$").join("\\$");
+
+/**
+ * Whether a `mathInline` node's LaTeX can be safely serialized as `$LaTeX$`
+ * (vs. the always-lossless schema-HTML `<span>` fallback). Requires:
+ *   - non-empty (an empty span has no readable `$…$` form),
+ *   - non-whitespace edges (pandoc's opening/closing whitespace rules),
+ *   - single line (inline math never spans lines),
+ *   - no pre-existing `\$` and no trailing `\` — either would make the
+ *     `$`→`\$` escape ambiguous on decode (a `\\$` sequence, or an escaped
+ *     closing `$`), so those rare cases take the `<span>` fallback instead.
+ * NOTE: a following-sibling digit (which would also break the pandoc closing
+ * rule) cannot be seen from the node alone; that case is handled by the
+ * serializer's inline-children pass, not here.
+ */
+export const inlineMathSerializable = (latex: string): boolean => {
+  if (latex.length === 0) return false; // nothing to put between the `$`s
+  if (/^\s|\s$/.test(latex)) return false; // whitespace at either edge
+  if (/[\r\n]/.test(latex)) return false; // must stay on a single line
+  // A `\$` inside, or a `\` at the very end, would decode ambiguously.
+  return !(latex.includes("\\$") || latex.endsWith("\\"));
+};
+
+/** Escape a value for an HTML double-quoted attribute: `&` and `"` only. */
+export const escapeMathAttr = (value: string): string =>
+  value.split("&").join("&amp;").split('"').join("&quot;");
diff --git a/packages/prosemirror-markdown/src/lib/media-html.ts b/packages/prosemirror-markdown/src/lib/media-html.ts
new file mode 100644
index 00000000..733f5aed
--- /dev/null
+++ b/packages/prosemirror-markdown/src/lib/media-html.ts
@@ -0,0 +1,172 @@
+/**
+ * Shared schema-HTML builders for the media/discriminator family (#293 canon
+ * #8).
+ *
+ * Canon #8 gives ten node types (youtube/video/audio/drawio/excalidraw —
+ * image-form; pdf/attachment/embed — link-form; pageEmbed/transclusionReference
+ * — standalone) a readable markdown TOP-LEVEL form (`![](src)`/`[text](src)`/a
+ * bare comment) plus a discriminator `<!--name {…}-->` comment. But TWO other
+ * paths still need the RAW SCHEMA-HTML form of each node:
+ *
+ *   1. The serializer's raw-HTML/columns path (`blockToHtml`): a comment node is
+ *      dropped by the DOM parse stage that reads a raw-HTML block back, so inside
+ *      a column/cell these nodes MUST stay schema HTML or they vanish (data loss).
+ *   2. The importer's `applyCommentDirectives`: to materialize the discriminator
+ *      comment it rebuilds the SAME schema element the raw-HTML path emits, then
+ *      swaps it in for the `<img>`/`<a>`/comment.
+ *
+ * Keeping these builders in ONE module means the serializer's raw-HTML path and
+ * the importer's materialization can never drift: both call the same function.
+ * Each builder reproduces BYTE-FOR-BYTE the schema HTML the top-level
+ * `processNode` cases previously returned (so existing columns/raw-HTML goldens
+ * stay green), and each output round-trips through the matching schema parseHTML
+ * in docmost-schema.ts.
+ */
+
+/**
+ * Make a value safe inside an HTML double-quoted attribute. Same semantics as
+ * markdown-converter's `escapeAttr`: only `&` and `"` are rewritten (parse5
+ * decodes both back). `<`, `>` and `'` are left alone on purpose, so values do
+ * not accumulate escapes across round-trips.
+ */
+const escapeAttr = (value: unknown): string =>
+  String(value).split("&").join("&amp;").split('"').join("&quot;");
+
+/**
+ * Uploaded `<video>` player, emitted as `<div><video …></video></div>`. The
+ * bare outer `<div>` (no data-type) forces block treatment, so marked does not
+ * wrap the inline `<video>` in a `<p>`. src/aria-label/width/height are plain
+ * attributes; attachmentId/size/align/aspectRatio ride as data-*.
+ */
+export function videoToHtml(attrs: Record<string, any>): string {
+  const { src, alt, attachmentId, width, height, size, align } = attrs;
+  let html = `src="${escapeAttr(src ?? "")}"`;
+  if (alt) html += ` aria-label="${escapeAttr(alt)}"`;
+  if (attachmentId) html += ` data-attachment-id="${escapeAttr(attachmentId)}"`;
+  if (width != null) html += ` width="${escapeAttr(width)}"`;
+  if (height != null) html += ` height="${escapeAttr(height)}"`;
+  if (size != null) html += ` data-size="${escapeAttr(size)}"`;
+  if (align) html += ` data-align="${escapeAttr(align)}"`;
+  if (attrs.aspectRatio != null)
+    html += ` data-aspect-ratio="${escapeAttr(attrs.aspectRatio)}"`;
+  return `<div><video ${html}></video></div>`;
+}
+
+/**
+ * YouTube embed, emitted as an empty `div[data-type="youtube"]`. The URL goes
+ * in data-src (an absent src becomes ""); width/height are added when not
+ * null/undefined and align when truthy, all as data-*.
+ */
+export function youtubeToHtml(attrs: Record<string, any>): string {
+  const { src, width, height, align } = attrs;
+  let html = `data-type="youtube" data-src="${escapeAttr(src ?? "")}"`;
+  if (width != null) html += ` data-width="${escapeAttr(width)}"`;
+  if (height != null) html += ` data-height="${escapeAttr(height)}"`;
+  if (align) html += ` data-align="${escapeAttr(align)}"`;
+  return `<div ${html}></div>`;
+}
+
+/** Uploaded `<audio>` player, emitted as `<div><audio …></audio></div>`. */
+export function audioToHtml(attrs: Record<string, any>): string {
+  const { src, attachmentId, size } = attrs;
+  let html = `src="${escapeAttr(src ?? "")}"`;
+  if (attachmentId) html += ` data-attachment-id="${escapeAttr(attachmentId)}"`;
+  if (size != null) html += ` data-size="${escapeAttr(size)}"`;
+  return `<div><audio ${html}></audio></div>`;
+}
+
+/**
+ * draw.io / excalidraw diagram (both use the shared diagramAttributes).
+ *
+ * Emits an empty `div[data-type="drawio"|"excalidraw"]`. Every attribute is a
+ * data-*: src is always present (an absent src becomes ""), followed in fixed
+ * order by title, alt, width, height, size, aspectRatio, align, attachmentId.
+ */
+export function diagramToHtml(
+  type: "drawio" | "excalidraw",
+  attrs: Record<string, any>,
+): string {
+  const { src, title, alt, width, height, size, aspectRatio, align } = attrs;
+  let html = `data-type="${type}" data-src="${escapeAttr(src ?? "")}"`;
+  // Emitted whenever present (not null/undefined), even if empty or 0.
+  if (title != null) html += ` data-title="${escapeAttr(title)}"`;
+  if (alt != null) html += ` data-alt="${escapeAttr(alt)}"`;
+  if (width != null) html += ` data-width="${escapeAttr(width)}"`;
+  if (height != null) html += ` data-height="${escapeAttr(height)}"`;
+  if (size != null) html += ` data-size="${escapeAttr(size)}"`;
+  if (aspectRatio != null)
+    html += ` data-aspect-ratio="${escapeAttr(aspectRatio)}"`;
+  // Emitted only when truthy.
+  if (align) html += ` data-align="${escapeAttr(align)}"`;
+  if (attrs.attachmentId)
+    html += ` data-attachment-id="${escapeAttr(attrs.attachmentId)}"`;
+  return `<div ${html}></div>`;
+}
+
+/**
+ * Generic provider embed, emitted as an empty `div[data-type="embed"]`.
+ * data-src and data-provider are always written (absent values become "");
+ * align, width and height follow as data-* when set.
+ */
+export function embedToHtml(attrs: Record<string, any>): string {
+  const { src, provider, align, width, height } = attrs;
+  let html = `data-type="embed" data-src="${escapeAttr(src ?? "")}"`;
+  html += ` data-provider="${escapeAttr(provider ?? "")}"`;
+  if (align) html += ` data-align="${escapeAttr(align)}"`;
+  if (width != null) html += ` data-width="${escapeAttr(width)}"`;
+  if (height != null) html += ` data-height="${escapeAttr(height)}"`;
+  return `<div ${html}></div>`;
+}
+
+/**
+ * Uploaded file attachment, emitted as an empty `div[data-type="attachment"]`.
+ * All values use the data-attachment-* prefix. The url is always written (an
+ * absent url becomes ""); name, mime and attachmentId are added when truthy,
+ * size when it is not null/undefined.
+ */
+export function attachmentToHtml(attrs: Record<string, any>): string {
+  const { url, name, mime, size, attachmentId } = attrs;
+  let html = `data-type="attachment"`;
+  html += ` data-attachment-url="${escapeAttr(url ?? "")}"`;
+  if (name) html += ` data-attachment-name="${escapeAttr(name)}"`;
+  if (mime) html += ` data-attachment-mime="${escapeAttr(mime)}"`;
+  if (size != null) html += ` data-attachment-size="${escapeAttr(size)}"`;
+  if (attachmentId) html += ` data-attachment-id="${escapeAttr(attachmentId)}"`;
+  return `<div ${html}></div>`;
+}
+
+/**
+ * Embedded PDF viewer, emitted as an empty `div[data-type="pdf"]`. src, width
+ * and height are plain attributes; name, attachmentId and size ride as data-*.
+ */
+export function pdfToHtml(attrs: Record<string, any>): string {
+  const { src, name, attachmentId, size, width, height } = attrs;
+  let html = `data-type="pdf" src="${escapeAttr(src ?? "")}"`;
+  if (name) html += ` data-name="${escapeAttr(name)}"`;
+  if (attachmentId) html += ` data-attachment-id="${escapeAttr(attachmentId)}"`;
+  if (size != null) html += ` data-size="${escapeAttr(size)}"`;
+  if (width != null) html += ` width="${escapeAttr(width)}"`;
+  if (height != null) html += ` height="${escapeAttr(height)}"`;
+  return `<div ${html}></div>`;
+}
+
+/** Whole-page live embed, emitted as an empty `div[data-type="pageEmbed"]`. */
+export function pageEmbedToHtml(attrs: Record<string, any>): string {
+  // The source page travels as data-source-page-id and is omitted when falsy.
+  const id = attrs.sourcePageId;
+  const source = id ? ` data-source-page-id="${escapeAttr(id)}"` : "";
+  return `<div data-type="pageEmbed"${source}></div>`;
+}
+
+/**
+ * Live transclusion reference, emitted as an empty
+ * `div[data-type="transclusionReference"]`; data-source-page-id and
+ * data-transclusion-id are each added only when truthy.
+ */
+export function transclusionReferenceToHtml(attrs: Record<string, any>): string {
+  const { sourcePageId: page, transclusionId: ref } = attrs;
+  let html = `data-type="transclusionReference"`;
+  if (page) html += ` data-source-page-id="${escapeAttr(page)}"`;
+  if (ref) html += ` data-transclusion-id="${escapeAttr(ref)}"`;
+  return `<div ${html}></div>`;
+}
diff --git a/packages/git-sync/src/lib/node-ops.ts b/packages/prosemirror-markdown/src/lib/node-ops.ts
similarity index 100%
rename from packages/git-sync/src/lib/node-ops.ts
rename to packages/prosemirror-markdown/src/lib/node-ops.ts
diff --git a/packages/git-sync/src/lib/page-file.ts b/packages/prosemirror-markdown/src/lib/page-file.ts
similarity index 100%
rename from packages/git-sync/src/lib/page-file.ts
rename to packages/prosemirror-markdown/src/lib/page-file.ts
diff --git a/packages/git-sync/test/canonicalize-extra.test.ts b/packages/prosemirror-markdown/test/canonicalize-extra.test.ts
similarity index 90%
rename from packages/git-sync/test/canonicalize-extra.test.ts
rename to packages/prosemirror-markdown/test/canonicalize-extra.test.ts
index e2103f80..fc3fa067 100644
--- a/packages/git-sync/test/canonicalize-extra.test.ts
+++ b/packages/prosemirror-markdown/test/canonicalize-extra.test.ts
@@ -6,7 +6,8 @@ import { canonicalizeContent, docsCanonicallyEqual } from 'docmost-client';
 
 // ---------------------------------------------------------------------------
 // Gaps NOT covered by canonicalize.test.ts (test-strategy report §2 diff):
-//   - the *.align family (drawio/excalidraw/video/youtube/embed): a "center"
+//   - the *.align family (drawio/excalidraw/video/youtube/embed AND image, whose
+//     align default is unified to "center" per #293 canon #4): a "center"
 //     default is dropped, a non-default value is kept;
 //   - comment.resolved: TRUE is PRESERVED (only resolved:false is normalized);
 //   - link.target / link.rel NON-default values are kept;
@@ -39,21 +40,27 @@ describe('canonicalizeContent — *.align default family', () => {
     });
   }
 
-  it('image align is NOT in KNOWN_DEFAULTS: a non-null align survives, null is dropped', () => {
-    // image.align defaults to null, so it is handled by the null-drop rule and
-    // a real value ("left") must be kept (no spurious default match).
+  it('image align default is now "center" (#293 canon #4): center/null dropped, left kept', () => {
+    // A real non-default value ("left") must be kept.
     const kept = canonicalizeContent({
       type: 'image',
       attrs: { id: 'i-1', src: '/a.png', align: 'left' },
     });
     expect(kept.attrs).toEqual({ src: '/a.png', align: 'left' });
-    // An image with align:"center" must KEEP it (center is NOT a default for
-    // image, only for the diagram/media family) — guards against over-matching.
+    // #293 canon #4 unified the image align default to "center" (matching
+    // editor-ext), so a center image now DROPS align exactly like the diagram/
+    // media family — bare `![](src)` images stay canonically clean.
     const center = canonicalizeContent({
       type: 'image',
       attrs: { id: 'i-2', src: '/b.png', align: 'center' },
     });
-    expect(center.attrs).toEqual({ src: '/b.png', align: 'center' });
+    expect(center.attrs).toEqual({ src: '/b.png' });
+    // A null align is likewise dropped (null-drop rule) and re-imports as center.
+    const nullAlign = canonicalizeContent({
+      type: 'image',
+      attrs: { id: 'i-3', src: '/c.png', align: null },
+    });
+    expect(nullAlign.attrs).toEqual({ src: '/c.png' });
   });
 });
 
diff --git a/packages/git-sync/test/canonicalize.test.ts b/packages/prosemirror-markdown/test/canonicalize.test.ts
similarity index 100%
rename from packages/git-sync/test/canonicalize.test.ts
rename to packages/prosemirror-markdown/test/canonicalize.test.ts
diff --git a/packages/git-sync/test/diagram-roundtrip.test.ts b/packages/prosemirror-markdown/test/diagram-roundtrip.test.ts
similarity index 65%
rename from packages/git-sync/test/diagram-roundtrip.test.ts
rename to packages/prosemirror-markdown/test/diagram-roundtrip.test.ts
index d8ffc5fe..bcc55ff8 100644
--- a/packages/git-sync/test/diagram-roundtrip.test.ts
+++ b/packages/prosemirror-markdown/test/diagram-roundtrip.test.ts
@@ -32,15 +32,16 @@ describe('diagram round-trip (docmost-schema diagramAttributes)', () => {
     const doc2 = await markdownToProseMirror(md1);
     const md2 = convertProseMirrorToMarkdown(doc2);
 
-    // Exact serialized form: numbers render as bare data-* values; attribute
-    // order follows the converter's emit order (src, then width/height/size/
-    // aspect-ratio/align, then attachment-id).
+    // #293 canon #8 (image-form): src is the markdown target; every OTHER
+    // non-default attr rides in the ALWAYS-emitted `drawio` discriminator comment
+    // (numerics stringified, stable key order width/height/size/aspectRatio then
+    // attachmentId). align="center" is the schema default, so it is OMITTED.
     expect(md1).toBe(
-      '<div data-type="drawio" data-src="/d.drawio" data-width="640" data-height="480" data-size="1234" data-aspect-ratio="1.777" data-align="center" data-attachment-id="att-1"></div>',
+      '![](/d.drawio)<!--drawio {"width":"640","height":"480","size":"1234","aspectRatio":"1.777","attachmentId":"att-1"}-->',
     );
 
-    // A second export reproduces the first byte-for-byte (drawio align default
-    // is already "center", so nothing new materializes on import).
+    // A second export reproduces the first byte-for-byte: align="center"
+    // re-materializes as the schema default on import and is omitted again.
     expect(md2).toBe(md1);
 
     // Re-import coerces every numeric attr to a STRING because parseHTML reads
@@ -64,10 +65,10 @@ describe('diagram round-trip (docmost-schema diagramAttributes)', () => {
   });
 
   // SPEC case 2: minimal excalidraw atom with ONLY string attrs (no align, no
-  // numeric attrs). Locks the one-time export divergence (align='center'
-  // default materializes only on import) plus escapeAttr of title/alt through
-  // the data-title/data-alt path.
-  it('excalidraw materializes align default only on import and escapes title/alt', async () => {
+  // numeric attrs). #293 canon #8 image-form: title/alt ride in the comment JSON
+  // (JSON-encoded, NOT HTML-escaped) and align='center' is omitted as the
+  // schema default — so the one-time divergence the OLD div-form had is GONE.
+  it('excalidraw round-trips title/alt via the discriminator comment (byte-stable, align default omitted)', async () => {
     const input = doc({
       type: 'excalidraw',
       attrs: {
@@ -81,21 +82,18 @@ describe('diagram round-trip (docmost-schema diagramAttributes)', () => {
     const doc2 = await markdownToProseMirror(md1);
     const md2 = convertProseMirrorToMarkdown(doc2);
 
-    // First export: no align emitted (the input doc carries no align), and the
-    // " in title becomes &quot;, the & in alt becomes &amp; via escapeAttr.
+    // #293 canon #8: src in the target; title/alt in the ALWAYS-emitted
+    // `excalidraw` comment as compact JSON (the " in title is JSON-escaped as \",
+    // the & in alt stays literal — JSON, not HTML). No align emitted (default).
     expect(md1).toBe(
-      '<div data-type="excalidraw" data-src="/e.excalidraw" data-title="My &quot;Diagram&quot;" data-alt="a&amp;b"></div>',
+      '![](/e.excalidraw)<!--excalidraw {"title":"My \\"Diagram\\"","alt":"a&b"}-->',
     );
 
-    // Second export: align='center' has now materialized (the schema's
-    // diagramAttributes default), so md2 gains a data-align="center" suffix and
-    // is NOT byte-equal to md1. This one-time divergence is the diagram quirk.
-    expect(md2).toBe(
-      '<div data-type="excalidraw" data-src="/e.excalidraw" data-title="My &quot;Diagram&quot;" data-alt="a&amp;b" data-align="center"></div>',
-    );
-    expect(md2).not.toBe(md1);
+    // Byte-stable: align='center' re-materializes as the schema default on import
+    // and is omitted again on export #2, so md2 === md1 (no diagram quirk now).
+    expect(md2).toBe(md1);
 
-    // Re-import decodes the escaped entities back to the original characters.
+    // Re-import decodes the JSON payload back to the original characters.
     const attrs2 = doc2.content[0].attrs;
     expect(attrs2.title).toBe('My "Diagram"');
     expect(attrs2.alt).toBe('a&b');
diff --git a/packages/git-sync/test/docmost-schema-attrs.test.ts b/packages/prosemirror-markdown/test/docmost-schema-attrs.test.ts
similarity index 100%
rename from packages/git-sync/test/docmost-schema-attrs.test.ts
rename to packages/prosemirror-markdown/test/docmost-schema-attrs.test.ts
diff --git a/packages/git-sync/test/fixtures/corpus/01-headings-paragraphs.json b/packages/prosemirror-markdown/test/fixtures/corpus/01-headings-paragraphs.json
similarity index 100%
rename from packages/git-sync/test/fixtures/corpus/01-headings-paragraphs.json
rename to packages/prosemirror-markdown/test/fixtures/corpus/01-headings-paragraphs.json
diff --git a/packages/git-sync/test/fixtures/corpus/02-inline-marks.json b/packages/prosemirror-markdown/test/fixtures/corpus/02-inline-marks.json
similarity index 100%
rename from packages/git-sync/test/fixtures/corpus/02-inline-marks.json
rename to packages/prosemirror-markdown/test/fixtures/corpus/02-inline-marks.json
diff --git a/packages/git-sync/test/fixtures/corpus/03-lists.json b/packages/prosemirror-markdown/test/fixtures/corpus/03-lists.json
similarity index 100%
rename from packages/git-sync/test/fixtures/corpus/03-lists.json
rename to packages/prosemirror-markdown/test/fixtures/corpus/03-lists.json
diff --git a/packages/git-sync/test/fixtures/corpus/04-blocks.json b/packages/prosemirror-markdown/test/fixtures/corpus/04-blocks.json
similarity index 100%
rename from packages/git-sync/test/fixtures/corpus/04-blocks.json
rename to packages/prosemirror-markdown/test/fixtures/corpus/04-blocks.json
diff --git a/packages/git-sync/test/fixtures/corpus/05-table.json b/packages/prosemirror-markdown/test/fixtures/corpus/05-table.json
similarity index 100%
rename from packages/git-sync/test/fixtures/corpus/05-table.json
rename to packages/prosemirror-markdown/test/fixtures/corpus/05-table.json
diff --git a/packages/git-sync/test/fixtures/corpus/06-diagrams.json b/packages/prosemirror-markdown/test/fixtures/corpus/06-diagrams.json
similarity index 100%
rename from packages/git-sync/test/fixtures/corpus/06-diagrams.json
rename to packages/prosemirror-markdown/test/fixtures/corpus/06-diagrams.json
diff --git a/packages/git-sync/test/fixtures/corpus/07-textstyle-mention.json b/packages/prosemirror-markdown/test/fixtures/corpus/07-textstyle-mention.json
similarity index 100%
rename from packages/git-sync/test/fixtures/corpus/07-textstyle-mention.json
rename to packages/prosemirror-markdown/test/fixtures/corpus/07-textstyle-mention.json
diff --git a/packages/git-sync/test/fixtures/corpus/08-details.json b/packages/prosemirror-markdown/test/fixtures/corpus/08-details.json
similarity index 100%
rename from packages/git-sync/test/fixtures/corpus/08-details.json
rename to packages/prosemirror-markdown/test/fixtures/corpus/08-details.json
diff --git a/packages/git-sync/test/fixtures/corpus/09-columns.json b/packages/prosemirror-markdown/test/fixtures/corpus/09-columns.json
similarity index 100%
rename from packages/git-sync/test/fixtures/corpus/09-columns.json
rename to packages/prosemirror-markdown/test/fixtures/corpus/09-columns.json
diff --git a/packages/git-sync/test/fixtures/corpus/10-mention-in-heading.json b/packages/prosemirror-markdown/test/fixtures/corpus/10-mention-in-heading.json
similarity index 100%
rename from packages/git-sync/test/fixtures/corpus/10-mention-in-heading.json
rename to packages/prosemirror-markdown/test/fixtures/corpus/10-mention-in-heading.json
diff --git a/packages/git-sync/test/fixtures/known-limitations/image-diagrams.json b/packages/prosemirror-markdown/test/fixtures/corpus/11-image-diagrams.json
similarity index 100%
rename from packages/git-sync/test/fixtures/known-limitations/image-diagrams.json
rename to packages/prosemirror-markdown/test/fixtures/corpus/11-image-diagrams.json
diff --git a/packages/git-sync/test/fixtures/sample-doc.json b/packages/prosemirror-markdown/test/fixtures/sample-doc.json
similarity index 100%
rename from packages/git-sync/test/fixtures/sample-doc.json
rename to packages/prosemirror-markdown/test/fixtures/sample-doc.json
diff --git a/packages/prosemirror-markdown/test/footnote.test.ts b/packages/prosemirror-markdown/test/footnote.test.ts
new file mode 100644
index 00000000..7d6fe4db
--- /dev/null
+++ b/packages/prosemirror-markdown/test/footnote.test.ts
@@ -0,0 +1,509 @@
+import { describe, expect, it } from "vitest";
+// Import the converters DIRECTLY from src (NOT the docmost-client barrel, which
+// mutates the global DOM at import time), matching the other converter tests.
+import { convertProseMirrorToMarkdown } from "../src/lib/markdown-converter.js";
+import { markdownToProseMirror } from "../src/lib/markdown-to-prosemirror.js";
+
+// ---------------------------------------------------------------------------
+// Tiny builders (mirror the other converter tests).
+// ---------------------------------------------------------------------------
+const doc = (...children: any[]) => ({ type: "doc", content: children });
+const P = (...inline: any[]) => ({ type: "paragraph", content: inline });
+// T leaves the `marks` key off entirely when no marks are passed.
+const T = (text: string, marks?: any[]) => (marks ? { type: "text", text, marks } : { type: "text", text });
+const ref = (id: string) => ({ type: "footnoteReference", attrs: { id } });
+const list = (...definitions: any[]) => ({ type: "footnotesList", content: definitions });
+const def = (id: string, ...paragraphs: any[]) => {
+  // Same `attrs: { id }` shape as `ref`, so a test can pair a ref with its def.
+  const attrs = { id };
+  return { type: "footnoteDefinition", attrs, content: paragraphs };
+};
+
+// Depth-first, pre-order search: returns the first node whose `type` matches,
+// or undefined when there is none (or `n` is not an object).
+function findNode(n: any, type: string): any {
+  const pending: any[] = [n];
+  while (pending.length > 0) {
+    const node = pending.shift();
+    if (!node || typeof node !== "object") continue;
+    if (node.type === type) return node;
+    if (Array.isArray(node.content)) pending.unshift(...node.content);
+  }
+  return undefined;
+}
+// Gather every node of `type` (document order) into `out` and return it.
+function findAll(n: any, type: string, out: any[] = []): any[] {
+  const isNode = Boolean(n) && typeof n === "object";
+  if (isNode && n.type === type) out.push(n);
+  for (const kid of isNode && Array.isArray(n.content) ? n.content : []) findAll(kid, type, out);
+  return out;
+}
+// Flatten a subtree to its text: text nodes give `text`, other nodes give their children's text.
+function allText(n: any): string {
+  const usable = Boolean(n) && typeof n === "object";
+  if (usable && n.type === "text") return n.text || "";
+  const kids: any[] = usable && Array.isArray(n.content) ? n.content : [];
+  return kids.reduce((acc: string, kid: any) => acc + allText(kid), "");
+}
+
+// ---------------------------------------------------------------------------
+// basic: a ref + its def export as inline `^[body]` at the reference point; byte-stable round trip.
+// ---------------------------------------------------------------------------
+describe("inline footnote: basic", () => {
+  it("serializes a ref + def to `text^[a note]` and re-imports losslessly", async () => {
+    const d = doc(P(T("text"), ref("fn1")), list(def("fn1", P(T("a note"))))); // source id is "fn1"
+    const md = convertProseMirrorToMarkdown(d);
+    expect(md).toBe("text^[a note]");
+
+    const back = await markdownToProseMirror(md);
+    const r = findNode(back, "footnoteReference");
+    const l = findNode(back, "footnotesList");
+    const dfn = findNode(back, "footnoteDefinition");
+    expect(r).toBeDefined();
+    expect(l).toBeDefined();
+    expect(dfn).toBeDefined();
+    // The note body rode along, not just the wrapper.
+    expect(allText(dfn)).toBe("a note");
+    // The re-imported reference and definition carry the same id.
+    expect(r.attrs.id).toBe(dfn.attrs.id);
+    // Ids are assigned sequentially by the import post-pass (F1), not hashed;
+    expect(r.attrs.id).toBe("fn-1"); // the source id "fn1" is not what comes back
+
+    // Byte-stable: re-export equals the first export.
+    const md2 = convertProseMirrorToMarkdown(back);
+    expect(md2).toBe(md);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// bracket balancing (MANDATORY): a `[link](url)` inside the body is captured
+// whole and survives as a link mark in the definition.
+// ---------------------------------------------------------------------------
+describe("inline footnote: bracket balancing", () => {
+  it("captures a full balanced `[link](url)` body and keeps the link", async () => {
+    const body = "note with a "; // leading plain-text run; the link and " inside" follow it
+    const d = doc(
+      P(T("x"), ref("fn1")),
+      list(
+        def(
+          "fn1",
+          P(
+            T(body),
+            T("link", [{ type: "link", attrs: { href: "https://x" } }]),
+            T(" inside"),
+          ),
+        ),
+      ),
+    );
+    const md = convertProseMirrorToMarkdown(d);
+    expect(md).toBe("x^[note with a [link](https://x) inside]");
+
+    const back = await markdownToProseMirror(md);
+    const dfn = findNode(back, "footnoteDefinition");
+    expect(allText(dfn)).toBe("note with a link inside");
+    // The link mark survived inside the definition (parser did NOT cut at the
+    // first inner `]`).
+    const linkText = findAll(dfn, "text").find((t: any) =>
+      (t.marks || []).some((m: any) => m.type === "link"),
+    );
+    expect(linkText).toBeDefined();
+    expect(linkText.text).toBe("link");
+    expect(linkText.marks[0].attrs.href).toBe("https://x"); // assumes link is the first mark on the run
+
+    const md2 = convertProseMirrorToMarkdown(back);
+    expect(md2).toBe(md);
+  });
+
+  it("escapes a STRAY unbalanced `]`/`[` in body text and round-trips it", async () => {
+    const d = doc(
+      P(T("x"), ref("fn1")),
+      list(def("fn1", P(T("a ] and [ stray")))),
+    );
+    const md = convertProseMirrorToMarkdown(d);
+    // The stray brackets are backslash-escaped so `^[…]` stays parseable.
+    expect(md).toBe("x^[a \\] and \\[ stray]"); // markdown bytes: x^[a \] and \[ stray]
+
+    const back = await markdownToProseMirror(md);
+    const dfn = findNode(back, "footnoteDefinition");
+    expect(allText(dfn)).toBe("a ] and [ stray");
+
+    const md2 = convertProseMirrorToMarkdown(back);
+    expect(md2).toBe(md);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// multi-paragraph body -> paragraphs joined by the two characters backslash + n.
+// ---------------------------------------------------------------------------
+describe("inline footnote: multi-paragraph body", () => {
+  it("joins two paragraphs with a literal `\\n` and re-splits them", async () => {
+    const d = doc(
+      P(T("x"), ref("fn1")),
+      list(def("fn1", P(T("para one")), P(T("para two")))),
+    );
+    const md = convertProseMirrorToMarkdown(d);
+    // The separator is the two literal characters backslash + n.
+    expect(md).toBe("x^[para one\\npara two]");
+    expect(md.includes("\\n")).toBe(true); // JS "\\n" = backslash followed by n
+    // NOT a real newline inside the footnote.
+    expect(md.includes("\n")).toBe(false); // JS "\n" = line feed (U+000A)
+
+    const back = await markdownToProseMirror(md);
+    const dfn = findNode(back, "footnoteDefinition");
+    const paras = (dfn.content || []).filter((p: any) => p.type === "paragraph");
+    expect(paras.length).toBe(2);
+    expect(allText(paras[0])).toBe("para one");
+    expect(allText(paras[1])).toBe("para two");
+
+    const md2 = convertProseMirrorToMarkdown(back);
+    expect(md2).toBe(md);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// real backslash-n escaping (MANDATORY): a literal `\n` in the body text is
+// emitted as `\\n` and round-trips to the literal text, NOT a paragraph break.
+// ---------------------------------------------------------------------------
+describe("inline footnote: real backslash-n escaping", () => {
+  it("escapes a literal `\\n` as `\\\\n` and keeps it a single paragraph", async () => {
+    // Body text contains the two literal characters: backslash, n.
+    const d = doc(
+      P(T("x"), ref("fn1")),
+      list(def("fn1", P(T("path C:\\new here")))), // text value: path C:\new here
+    );
+    const md = convertProseMirrorToMarkdown(d);
+    // The real backslash-n becomes an ESCAPED backslash-n (`\\n`).
+    expect(md).toBe("x^[path C:\\\\new here]"); // markdown bytes: x^[path C:\\new here]
+
+    const back = await markdownToProseMirror(md);
+    const dfn = findNode(back, "footnoteDefinition");
+    const paras = (dfn.content || []).filter((p: any) => p.type === "paragraph");
+    // A single paragraph — the `\n` was NOT read as a paragraph break.
+    expect(paras.length).toBe(1);
+    expect(allText(dfn)).toBe("path C:\\new here");
+
+    const md2 = convertProseMirrorToMarkdown(back);
+    expect(md2).toBe(md);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// dedup / multiple refs.
+// ---------------------------------------------------------------------------
+describe("inline footnote: dedup", () => {
+  it("two refs to the SAME def emit `^[same]` twice and MERGE on parse", async () => {
+    const d = doc(
+      P(T("a"), ref("fn1"), T(" b"), ref("fn1")),
+      list(def("fn1", P(T("same text")))),
+    );
+    const md = convertProseMirrorToMarkdown(d);
+    expect(md).toBe("a^[same text] b^[same text]");
+
+    const back = await markdownToProseMirror(md);
+    // Two references, ONE definition (merged), sharing the same id.
+    const refs = findAll(back, "footnoteReference");
+    const defs = findAll(back, "footnoteDefinition");
+    expect(refs.length).toBe(2);
+    expect(defs.length).toBe(1);
+    expect(refs[0].attrs.id).toBe(refs[1].attrs.id);
+    expect(refs[0].attrs.id).toBe(defs[0].attrs.id);
+
+    const md2 = convertProseMirrorToMarkdown(back);
+    expect(md2).toBe(md);
+  });
+
+  it("two `^[identical]` in SOURCE merge to one definition", async () => {
+    const back = await markdownToProseMirror("a^[note] b^[note]");
+    const refs = findAll(back, "footnoteReference");
+    const defs = findAll(back, "footnoteDefinition");
+    expect(defs.length).toBe(1);
+    // BOTH refs must resolve to the merged def (also pins refs.length to 2): no dangling 2nd ref.
+    expect(refs.map((r: any) => r.attrs.id)).toEqual([defs[0].attrs.id, defs[0].attrs.id]);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// footnote inside a column -> raw-HTML `<sup data-fn-text>` form (NOT `^[…]`).
+// ---------------------------------------------------------------------------
+describe("inline footnote: inside a column", () => {
+  it("carries the body on `<sup data-fn-text>` and round-trips", async () => {
+    const d = doc(
+      {
+        type: "columns",
+        content: [
+          {
+            type: "column",
+            attrs: { width: "50%" },
+            content: [P(T("col "), ref("fn1"))],
+          },
+        ],
+      },
+      list(def("fn1", P(T("colnote")))),
+    );
+    const md = convertProseMirrorToMarkdown(d);
+    // Raw-HTML path: the ref carries its text ON the sup, NOT as `^[…]`.
+    expect(md).toContain('data-fn-text="colnote"');
+    expect(md).not.toContain("^[");
+
+    const back = await markdownToProseMirror(md);
+    // The reference stays inside the column; the definition is looked up across
+    // the whole doc (its exact position in the tree is not asserted here).
+    const col = findNode(back, "column");
+    expect(findNode(col, "footnoteReference")).toBeDefined();
+    const dfn = findNode(back, "footnoteDefinition");
+    expect(allText(dfn)).toBe("colnote");
+    const r = findNode(back, "footnoteReference");
+    expect(r.attrs.id).toBe(dfn.attrs.id);
+
+    // Only the footnote portion is checked on re-export (the surrounding columns
+    // node applies its own layout/width normalization, unrelated to footnotes).
+    // The raw-HTML column sup carries the body on data-fn-text and NO id (F1);
+    // the id is assigned by the import post-pass.
+    const md2 = convertProseMirrorToMarkdown(back);
+    expect(md2).toContain('data-fn-text="colnote"');
+    expect(md2).not.toContain("data-id=");
+  });
+});
+
+// ---------------------------------------------------------------------------
+// orphan definition: a def with no reference is not silently lost (export + re-import only).
+// ---------------------------------------------------------------------------
+describe("inline footnote: orphan definition", () => {
+  it("appends an unreferenced definition as its own `^[body]` line", async () => {
+    const d = doc(P(T("body text")), list(def("fnX", P(T("orphan note"))))); // no ref("fnX") anywhere
+    const md = convertProseMirrorToMarkdown(d);
+    expect(md).toBe("body text\n\n^[orphan note]"); // blank line, then the orphan on its own line
+
+    const back = await markdownToProseMirror(md);
+    const dfn = findNode(back, "footnoteDefinition");
+    expect(dfn).toBeDefined();
+    expect(allText(dfn)).toBe("orphan note");
+  });
+});
+
+// ---------------------------------------------------------------------------
+// no backward compat: `[^id]` / `[^id]: def` stay literal (no footnote node).
+// ---------------------------------------------------------------------------
+describe("inline footnote: no backward compat for the reference form", () => {
+  it("does not parse `[^1]` into a footnote node", async () => {
+    const back = await markdownToProseMirror("see [^1] here");
+    expect(findNode(back, "footnoteReference")).toBeUndefined();
+    expect(findNode(back, "footnotesList")).toBeUndefined();
+    // The literal text survives.
+    expect(allText(back)).toContain("[^1]");
+  });
+
+  it("does not parse a `[^1]: def` definition line into a footnote node", async () => {
+    const back = await markdownToProseMirror("text\n\n[^1]: a definition"); // "\n\n": the def line is its own block
+    expect(findNode(back, "footnoteReference")).toBeUndefined();
+    expect(findNode(back, "footnoteDefinition")).toBeUndefined();
+    expect(findNode(back, "footnotesList")).toBeUndefined(); // only absence of nodes is checked, not the text
+  });
+});
+
+// ---------------------------------------------------------------------------
+// literal `^[` in prose must NOT materialize a phantom footnote on re-import.
+// ---------------------------------------------------------------------------
+describe("inline footnote: literal `^[` in prose", () => {
+  it("escapes a literal `^[…]` in text so it stays text, byte-stable", async () => {
+    const d = doc(P(T("see ^[not a note] here"))); // plain text only: no footnote nodes in the source
+    const md = convertProseMirrorToMarkdown(d);
+    // The opening `^[` is broken with a backslash so the tokenizer never fires.
+    expect(md).toBe("see ^\\[not a note] here"); // markdown bytes: see ^\[not a note] here
+
+    const back = await markdownToProseMirror(md);
+    expect(findNode(back, "footnoteReference")).toBeUndefined();
+    expect(allText(back)).toBe("see ^[not a note] here");
+
+    const md2 = convertProseMirrorToMarkdown(back);
+    expect(md2).toBe(md);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// fail-open: unbalanced `^[` and empty `^[]` do not crash.
+// ---------------------------------------------------------------------------
+describe("inline footnote: fail-open", () => {
+  it("leaves an unbalanced `^[` as literal text, no crash", async () => {
+    const back = await markdownToProseMirror("dangling ^[ open bracket");
+    expect(findNode(back, "footnoteReference")).toBeUndefined();
+    expect(allText(back)).toContain("^[ open bracket"); // substring check from the `^[` onward
+  });
+
+  it("treats `^[]` as a footnote with an empty body, no crash", async () => {
+    const back = await markdownToProseMirror("empty^[]");
+    const r = findNode(back, "footnoteReference");
+    const dfn = findNode(back, "footnoteDefinition");
+    expect(r).toBeDefined();
+    expect(dfn).toBeDefined();
+    expect(allText(dfn)).toBe(""); // the definition exists but holds no text
+    // Byte-stable: an empty-body footnote re-exports as `^[]`.
+    expect(convertProseMirrorToMarkdown(back)).toBe("empty^[]");
+  });
+});
+
+// ---------------------------------------------------------------------------
+// F1 (CRITICAL): DIFFERENT bodies must NEVER merge — dedup keys on exact text,
+// not a 32-bit hash (the old djb2 hash collided `"sgrs rj"` / `"a gtkfr"`).
+// ---------------------------------------------------------------------------
+describe("inline footnote: distinct bodies never merge (F1)", () => {
+  it("keeps the hash-colliding pair `sgrs rj` / `a gtkfr` as two distinct defs", async () => {
+    // These two DIFFERENT bodies hashed to the same fn-16myybs under djb2, which
+    // silently dropped the second body. With text-exact dedup they must survive
+    // as two separate definitions.
+    const d = doc(
+      P(T("x"), ref("fnA"), T(" y"), ref("fnB")),
+      list(def("fnA", P(T("sgrs rj"))), def("fnB", P(T("a gtkfr")))),
+    );
+    const md = convertProseMirrorToMarkdown(d);
+    expect(md).toBe("x^[sgrs rj] y^[a gtkfr]");
+
+    const back = await markdownToProseMirror(md);
+    const defs = findAll(back, "footnoteDefinition");
+    const refs = findAll(back, "footnoteReference");
+    // BOTH bodies survive as DISTINCT definitions.
+    expect(defs.length).toBe(2);
+    const bodies = defs.map(allText).sort(); // sorted so the check does not depend on def order
+    expect(bodies).toEqual(["a gtkfr", "sgrs rj"]);
+    // Two refs, each pointing at a DIFFERENT def id.
+    expect(refs.length).toBe(2);
+    expect(refs[0].attrs.id).not.toBe(refs[1].attrs.id);
+    expect(new Set(defs.map((x: any) => x.attrs.id)).size).toBe(2); // def ids are unique too
+
+    const md2 = convertProseMirrorToMarkdown(back);
+    expect(md2).toBe(md);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// F2 (CRITICAL): a body ending in `\` (or `\` before `]`) must survive `^[…]`.
+// Each must round-trip BYTE-STABLE across 3 iterations, footnote intact.
+// ---------------------------------------------------------------------------
+describe("inline footnote: raw backslash bodies survive (F2)", () => {
+  const cases: Array<{ name: string; body: string; expectMd: string }> = [
+    {
+      name: "trailing backslash (Windows path)",
+      body: "C:\\dir\\", // text value: C:\dir\ (ends in one backslash)
+      expectMd: "x^[C:\\\\dir\\\\]", // markdown bytes: x^[C:\\dir\\]
+    },
+    {
+      name: "backslash before a literal bracket",
+      body: "a \\] b", // text value: a \] b
+      expectMd: "x^[a \\\\\\] b]", // markdown bytes: x^[a \\\] b]
+    },
+    {
+      name: "regex with trailing backslash",
+      body: "re\\gex\\", // text value: re\gex\ (ends in one backslash)
+      expectMd: "x^[re\\\\gex\\\\]", // markdown bytes: x^[re\\gex\\]
+    },
+  ];
+  for (const { name, body, expectMd } of cases) {
+    it(`round-trips ${name} byte-stable x3 with the backslash preserved`, async () => {
+      const d = doc(P(T("x"), ref("fn1")), list(def("fn1", P(T(body)))));
+      let md = convertProseMirrorToMarkdown(d);
+      expect(md).toBe(expectMd);
+
+      // Three full iterations must all be byte-identical and keep the footnote.
+      for (let iter = 0; iter < 3; iter++) {
+        const back = await markdownToProseMirror(md);
+        const dfn = findNode(back, "footnoteDefinition");
+        expect(dfn).toBeDefined();
+        // The backslashes are preserved EXACTLY in the note body.
+        expect(allText(dfn)).toBe(body);
+        const md2 = convertProseMirrorToMarkdown(back);
+        expect(md2).toBe(md);
+        md = md2; // feed this iteration's export into the next import
+      }
+    });
+  }
+});
+
+// ---------------------------------------------------------------------------
+// F4: assembleFootnotes must not emit a DUPLICATE <section data-footnotes> when
+// the HTML already carries one (a footnote list that landed in a column).
+// ---------------------------------------------------------------------------
+describe("inline footnote: no duplicate footnotes section (F4)", () => {
+  it("produces exactly one footnotesList when a column footnote is present", async () => {
+    const d = doc(
+      {
+        type: "columns",
+        content: [
+          { type: "column", attrs: { width: "50%" }, content: [P(T("c "), ref("fn1"))] },
+        ],
+      },
+      list(def("fn1", P(T("colnote")))),
+    );
+    const md = convertProseMirrorToMarkdown(d); // same doc shape as the "inside a column" test
+    const back = await markdownToProseMirror(md);
+    // Exactly one assembled footnotes list, not two.
+    expect(findAll(back, "footnotesList").length).toBe(1); // findAll searches the whole tree
+  });
+});
+
+// ---------------------------------------------------------------------------
+// N1 (data-loss): NESTED inline footnotes must round-trip — the assembly pass
+// runs to a FIXED POINT so an inner `^[…]` spawned by parseInline is also
+// assigned an id, built into a def, and stripped (no dangling ref, no lost body).
+// ---------------------------------------------------------------------------
+describe("inline footnote: nested footnotes (N1)", () => {
+  it("keeps `^[outer ^[inner] tail]` as TWO defs, inner preserved, byte-stable", async () => {
+    const md1 = "text ^[outer ^[inner] tail] end";
+    const back = await markdownToProseMirror(md1);
+    const defs = findAll(back, "footnoteDefinition");
+    const refs = findAll(back, "footnoteReference");
+    // Two distinct definitions (outer + inner); two references.
+    expect(defs.length).toBe(2);
+    expect(refs.length).toBe(2);
+    expect(new Set(defs.map((d: any) => d.attrs.id)).size).toBe(2);
+    const bodies = defs.map(allText).sort();
+    expect(bodies).toEqual(["inner", "outer  tail"]); // two spaces: allText adds nothing for the nested ref
+    // The OUTER definition body carries a footnoteReference to the inner def.
+    const outer = defs.find((d: any) => allText(d).includes("outer"));
+    const inner = defs.find((d: any) => allText(d) === "inner");
+    const nestedRef = findNode(outer, "footnoteReference");
+    expect(nestedRef).toBeDefined();
+    expect(nestedRef.attrs.id).toBe(inner.attrs.id);
+    // Byte-stable across two further iterations (md1 === md2 === md3).
+    const md2 = convertProseMirrorToMarkdown(back);
+    expect(md2).toBe(md1);
+    const md3 = convertProseMirrorToMarkdown(await markdownToProseMirror(md2));
+    expect(md3).toBe(md2);
+  });
+
+  it("round-trips a 3-level nest `^[a ^[b ^[c] d] e]` (three defs)", async () => {
+    const md1 = "z ^[a ^[b ^[c] d] e] z";
+    const back = await markdownToProseMirror(md1);
+    const defs = findAll(back, "footnoteDefinition");
+    expect(defs.length).toBe(3);
+    expect(new Set(defs.map((d: any) => d.attrs.id)).size).toBe(3);
+    expect(defs.map(allText).sort()).toEqual(["a  e", "b  d", "c"]); // double spaces: nested refs add no text
+    const md2 = convertProseMirrorToMarkdown(back);
+    expect(md2).toBe(md1);
+    const md3 = convertProseMirrorToMarkdown(await markdownToProseMirror(md2));
+    expect(md3).toBe(md2);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// N2: a generated id must never collide with an id already present in a REUSED
+// footnotes section (the counter is seeded past the max existing `fn-N`).
+// ---------------------------------------------------------------------------
+describe("inline footnote: generated ids never collide with a reused section (N2)", () => {
+  it("seeds the counter past an existing `fn-1` def in a legacy section", async () => {
+    // A legacy `<section data-footnotes>` (existing `fn-1`) reaches the body as
+    // raw HTML; the new inline `^[…]` must NOT be assigned `fn-1` too.
+    const md =
+      "text^[new note]\n\n" +
+      '<section data-footnotes><div data-footnote-def data-id="fn-1">' +
+      "<p>existing note</p></div></section>";
+    const back = await markdownToProseMirror(md);
+    const defs = findAll(back, "footnoteDefinition");
+    // Both notes survive as DISTINCT definitions in a SINGLE list.
+    expect(defs.length).toBe(2);
+    expect(new Set(defs.map((d: any) => d.attrs.id)).size).toBe(2);
+    expect(findAll(back, "footnotesList").length).toBe(1);
+    expect(defs.map(allText).sort()).toEqual(["existing note", "new note"]); // sorted: def order is not asserted
+    // The pre-existing id is preserved; the new one is seeded past it.
+    expect(defs.map((d: any) => d.attrs.id)).toContain("fn-1");
+    expect(defs.map((d: any) => d.attrs.id)).toContain("fn-2"); // which note owns which id is not asserted
+  });
+});
diff --git a/packages/prosemirror-markdown/test/highlight.test.ts b/packages/prosemirror-markdown/test/highlight.test.ts
new file mode 100644
index 00000000..012fcddc
--- /dev/null
+++ b/packages/prosemirror-markdown/test/highlight.test.ts
@@ -0,0 +1,249 @@
+import { describe, expect, it } from 'vitest';
+// Import both directions DIRECTLY from src (NOT the docmost-client barrel, which
+// pulls in collaboration.ts and mutates the global DOM at import time), matching
+// the other converter unit tests.
+import { convertProseMirrorToMarkdown } from '../src/lib/markdown-converter.js';
+import { markdownToProseMirror } from '../src/lib/markdown-to-prosemirror.js';
+
+// #293 canon #7: a `highlight` mark WITHOUT a color serializes as the
+// Obsidian-style `==text==` extension (not part of GFM); one WITH a color KEEPS
+// the `<mark style="background-color: …">` HTML form. On the raw-HTML path
+// (columns / spanned cells) BOTH forms stay `<mark>` because markdown is not
+// re-parsed there. This file locks the serialized form, the round-trip, and the
+// literal-`==` escape that keeps a literal `==` from becoming a phantom mark.
+
+// Minimal PM-JSON builders; `text` leaves the `marks` key off when none are given.
+const doc = (...blocks: any[]) => ({ type: 'doc', content: blocks });
+const text = (t: string, marks?: any[]) => (marks ? { type: 'text', text: t, marks } : { type: 'text', text: t });
+const para = (...children: any[]) => ({ type: 'paragraph', content: children });
+
+// Depth-first, pre-order: first text node carrying a mark of `type`, else null.
+const firstMarkedText = (node: any, type: string): any => {
+  const carries = (n: any) => n?.type === 'text' && (n.marks || []).some((m: any) => m.type === type);
+  const queue: any[] = [node];
+  while (queue.length > 0) {
+    const current = queue.shift();
+    if (carries(current)) return current;
+    queue.unshift(...(current?.content || []));
+  }
+  return null;
+};
+// First mark object of `type` on `textNode`, or undefined when it carries none.
+const mark = (textNode: any, type: string): any => (textNode?.marks || []).filter((m: any) => m.type === type)[0];
+// Text of a subtree in document order ('' for a node with neither text nor children).
+const allText = (node: any): string =>
+  node?.type === 'text'
+    ? node.text || ''
+    : (node?.content || []).reduce((acc: string, child: any) => acc + allText(child), '');
+// True when at least one text node in the tree carries a mark of `type`.
+const hasMark = (node: any, type: string): boolean => Boolean(firstMarkedText(node, type));
+
+// Export `d`, re-import that markdown, export again; returns all three stages.
+const roundTrip = async (d: any) => {
+  const firstExport = convertProseMirrorToMarkdown(d);
+  const reimported = await markdownToProseMirror(firstExport);
+  const secondExport = convertProseMirrorToMarkdown(reimported);
+  return { md1: firstExport, doc2: reimported, md2: secondExport };
+};
+
+describe('#293 #7: no-color highlight <-> ==text==', () => {
+  it('serializes a no-color highlight as exactly ==text==', () => {
+    expect(convertProseMirrorToMarkdown(doc(para(text('important', [{ type: 'highlight' }]))))).toBe(
+      '==important==',
+    );
+  });
+
+  it('imports ==text== as a highlight mark with NO color', async () => {
+    const d = await markdownToProseMirror('==important==');
+    const t = firstMarkedText(d, 'highlight');
+    expect(t).toBeTruthy();
+    expect(t.text).toBe('important');
+    // A bare <mark> carries no background-color, so the color attr is null.
+    expect(mark(t, 'highlight').attrs?.color ?? null).toBeNull(); // `?? null`: a missing attr counts as no color too
+  });
+
+  it('is byte-stable and re-imports as a color-less highlight', async () => {
+    const { md1, md2, doc2 } = await roundTrip(
+      doc(para(text('a base '), text('hl', [{ type: 'highlight' }]), text(' tail'))),
+    );
+    expect(md1).toBe('a base ==hl== tail');
+    expect(md2).toBe(md1);
+    const t = firstMarkedText(doc2, 'highlight');
+    expect(t.text).toBe('hl'); // only the middle run is highlighted, not its neighbours
+    expect(mark(t, 'highlight').attrs?.color ?? null).toBeNull();
+  });
+});
+
+describe('#293 #7: colored highlight keeps <mark style=…>', () => {
+  it('serializes a colored highlight as the <mark style=…> HTML form (NOT ==)', () => {
+    const out = convertProseMirrorToMarkdown(
+      doc(para(text('c', [{ type: 'highlight', attrs: { color: '#ff0000' } }]))),
+    );
+    expect(out).toBe('<mark style="background-color: #ff0000">c</mark>');
+    expect(out).not.toContain('=='); // implied by the exact match above; kept as an explicit guard
+  });
+
+  it('round-trips a colored highlight preserving its color', async () => {
+    const { md1, md2, doc2 } = await roundTrip(
+      doc(para(text('c', [{ type: 'highlight', attrs: { color: '#abcdef' } }]))),
+    );
+    expect(md1).toBe('<mark style="background-color: #abcdef">c</mark>');
+    expect(md2).toBe(md1);
+    const t = firstMarkedText(doc2, 'highlight');
+    expect(mark(t, 'highlight').attrs?.color).toBe('#abcdef'); // color comes back exactly as written
+  });
+});
+
+describe('#293 #7: raw-HTML path (columns) stays <mark>, never ==', () => {
+  const oneColumn = (...blocks: any[]) => ({ // a `columns` node wrapping a single `column` of `blocks`
+    type: 'columns',
+    attrs: { layout: 'two' },
+    content: [{ type: 'column', content: blocks }],
+  });
+
+  it('a no-color highlight inside a column serializes as <mark> (inlineToHtml), not ==', () => {
+    const out = convertProseMirrorToMarkdown(doc(oneColumn(para(text('p', [{ type: 'highlight' }])))));
+    expect(out).toContain('<mark>p</mark>');
+    // The `==` markdown syntax must NOT leak into a raw-HTML container (it would
+    // survive as literal text there because columns are not re-parsed).
+    expect(out).not.toContain('==');
+  });
+
+  it('a colored highlight inside a column keeps <mark style=…>', () => {
+    const out = convertProseMirrorToMarkdown(
+      doc(oneColumn(para(text('p', [{ type: 'highlight', attrs: { color: '#00ff00' } }])))),
+    );
+    expect(out).toContain('<mark style="background-color: #00ff00">p</mark>');
+  });
+
+  it('round-trips a highlight inside a column (byte-stable, mark preserved)', async () => {
+    const { md1, md2, doc2 } = await roundTrip(
+      doc(oneColumn(para(text('p', [{ type: 'highlight' }])))),
+    );
+    expect(md1).toContain('<mark>p</mark>');
+    expect(md2).toBe(md1); // whole-document byte stability, columns wrapper included
+    expect(hasMark(doc2, 'highlight')).toBe(true);
+  });
+});
+
+describe('#293 #7: highlight wrapping other marks', () => {
+  it('serializes bold-inside-highlight as ==**x**== and round-trips both marks', async () => {
+    const { md1, md2, doc2 } = await roundTrip(
+      doc(para(text('x', [{ type: 'bold' }, { type: 'highlight' }]))), // one run, bold listed before highlight
+    );
+    expect(md1).toBe('==**x**=='); // highlight delimiters outermost, bold inside
+    expect(md2).toBe(md1);
+    const t = firstMarkedText(doc2, 'highlight');
+    expect(t).toBeTruthy();
+    expect((t.marks || []).some((m: any) => m.type === 'bold')).toBe(true);
+    expect(t.text).toBe('x');
+  });
+});
+
+describe('#293 #7: inline code containing == stays code, not a highlight', () => {
+  it('imports `a == b` as an inline code span, not a highlight', async () => {
+    const d = await markdownToProseMirror('`a == b`'); // the backticks are part of the markdown input
+    expect(hasMark(d, 'highlight')).toBe(false);
+    const codeText = firstMarkedText(d, 'code');
+    expect(codeText).toBeTruthy();
+    expect(codeText.text).toBe('a == b');
+  });
+
+  it('round-trips an inline code span carrying == (byte-stable, no highlight)', async () => {
+    const { md1, md2, doc2 } = await roundTrip(doc(para(text('a == b', [{ type: 'code' }]))));
+    expect(md1).toBe('`a == b`'); // no `\=` escaping inside the code span
+    expect(md2).toBe(md1);
+    expect(hasMark(doc2, 'highlight')).toBe(false);
+    expect(firstMarkedText(doc2, 'code').text).toBe('a == b');
+  });
+});
+
+describe('#293 #7: literal == in plain prose round-trips as text (no phantom highlight)', () => {
+  it('a lone literal == (a == b) is escaped and re-imports as literal text', async () => {
+    const { md1, md2, doc2 } = await roundTrip(doc(para(text('a == b'))));
+    // Each `=` of the pair is backslash-escaped so marked decodes it back.
+    expect(md1).toBe('a \\=\\= b'); // markdown bytes: a \=\= b
+    expect(md2).toBe(md1);
+    expect(hasMark(doc2, 'highlight')).toBe(false);
+    expect(allText(doc2)).toBe('a == b');
+  });
+
+  it('a literal ==...== pair in prose does NOT materialize a highlight', async () => {
+    const { md1, md2, doc2 } = await roundTrip(doc(para(text('x ==not hl== y'))));
+    expect(md1).toBe('x \\=\\=not hl\\=\\= y'); // markdown bytes: x \=\=not hl\=\= y
+    expect(md2).toBe(md1);
+    expect(hasMark(doc2, 'highlight')).toBe(false);
+    expect(allText(doc2)).toBe('x ==not hl== y');
+  });
+
+  it('a highlight over text that itself contains a literal == round-trips both', async () => {
+    const { md1, md2, doc2 } = await roundTrip(
+      doc(para(text('a == b', [{ type: 'highlight' }]))),
+    );
+    // The inner literal `==` is escaped; the highlight `==` delimiters are added
+    // AFTER escaping, so the mark's own delimiters are intact.
+    expect(md1).toBe('==a \\=\\= b=='); // markdown bytes: ==a \=\= b==
+    expect(md2).toBe(md1);
+    const t = firstMarkedText(doc2, 'highlight');
+    expect(t.text).toBe('a == b');
+  });
+});
+
+describe('#293 #7: fail-open edges (empty / unbalanced ==)', () => {
+  it('empty ==== does not crash and stays literal (no highlight)', async () => {
+    const d = await markdownToProseMirror('====');
+    expect(hasMark(d, 'highlight')).toBe(false);
+    expect(allText(d)).toBe('====');
+  });
+
+  it('unbalanced ==x does not crash and stays literal (no highlight)', async () => {
+    const d = await markdownToProseMirror('==x');
+    expect(hasMark(d, 'highlight')).toBe(false);
+    expect(allText(d)).toBe('==x');
+  });
+
+  it('two highlights on one line both parse (lazy inner)', async () => {
+    const d = await markdownToProseMirror('==a== ==b==');
+    // Collect EVERY highlighted run: a greedy inner match would give one run
+    // `a== ==b`, and a dropped second mark would leave `b` as plain text.
+    const texts = (n: any): any[] => (n?.type === 'text' ? [n] : (n?.content || []).flatMap(texts));
+    const runs = texts(d).filter((t: any) => (t.marks || []).some((m: any) => m.type === 'highlight'));
+    expect(runs.map((t: any) => t.text)).toEqual(['a', 'b']);
+  });
+});
+
+describe('#293 #7: a codeBlock containing == is NOT escaped (literal code preserved)', () => {
+  // Regression: the canon #7 `==` -> `\=\=` escape lives in `case "text"`, but
+  // code-fence content is literal and marked does NOT decode `\=` inside a fence,
+  // so routing code through that path would permanently stamp backslashes into a
+  // `==` comparison (ubiquitous in source). codeBlock must read raw child text.
+  const codeBlock = (t: string, language = '') => ({ // codeBlock node with one raw text child
+    type: 'codeBlock',
+    attrs: { language },
+    content: [{ type: 'text', text: t }],
+  });
+
+  it('exports `==` in code verbatim (no \\=\\=) and round-trips byte-stably', async () => {
+    const d = doc(codeBlock('if (a == b) return c == d;', 'js'));
+    const md1 = convertProseMirrorToMarkdown(d);
+    expect(md1).toBe('```js\nif (a == b) return c == d;\n```'); // `language` becomes the fence info string
+    expect(md1).not.toContain('\\='); // no backslash corruption
+    const back = await markdownToProseMirror(md1);
+    // The code text survives with no backslash corruption and no phantom
+    // highlight (marked re-adds a trailing "\n" to fence content on import,
+    // which the serializer strips again — hence trimEnd here; byte-stability of
+    // the markdown is asserted separately below).
+    expect(allText(back).trimEnd()).toBe('if (a == b) return c == d;');
+    expect(allText(back)).not.toContain('\\=');
+    expect(hasMark(back, 'highlight')).toBe(false);
+    expect(convertProseMirrorToMarkdown(back)).toBe(md1); // byte-stable
+  });
+
+  it('a real markdown code block with == imports clean and re-exports clean', async () => {
+    const src = '```\nx == y\n```'; // fence with no language
+    const back = await markdownToProseMirror(src);
+    expect(allText(back).trimEnd()).toBe('x == y');
+    expect(allText(back)).not.toContain('\\=');
+    expect(convertProseMirrorToMarkdown(back)).toBe(src); // byte-stable
+  });
+});
diff --git a/packages/prosemirror-markdown/test/image-comment.test.ts b/packages/prosemirror-markdown/test/image-comment.test.ts
new file mode 100644
index 00000000..605e3e5b
--- /dev/null
+++ b/packages/prosemirror-markdown/test/image-comment.test.ts
@@ -0,0 +1,265 @@
+import { describe, expect, it } from 'vitest';
+// Import DIRECTLY from src (matching the other converter unit tests), not the
+// docmost-client barrel.
+import { convertProseMirrorToMarkdown } from '../src/lib/markdown-converter.js';
+import { markdownToProseMirror } from '../src/lib/markdown-to-prosemirror.js';
+
+// ---------------------------------------------------------------------------
+// #293 canon #4: images ALWAYS serialize as `![alt](src)`. Non-default attrs
+// ride along in an attached `<!--img {…}-->` comment on the SAME line, which the
+// importer materializes back onto the <img> before generateJSON drops it. An
+// attr equal to the schema default is NOT emitted. The image align default is
+// unified to "center" (matching editor-ext), so bare/center images stay clean
+// and only a genuinely non-default alignment (left/right) emits a comment.
+//
+// In raw-HTML contexts (inside a column / spanned cell) the prior `<img …>` form
+// is kept; comments are dropped by the DOM parse stage there.
+// ---------------------------------------------------------------------------
+
+const doc = (...nodes: any[]) => ({ type: 'doc', content: nodes });
+const image = (attrs: any) => doc({ type: 'image', attrs: { src: '/i.png', ...attrs } });
+
+// Find the first image node anywhere in a PM JSON doc.
+function findImage(node: any): any | null {
+  if (!node || typeof node !== 'object') return null;
+  if (node.type === 'image') return node;
+  // Depth-first in document order; a missing/non-array `content` is a leaf.
+  const children: any[] = Array.isArray(node.content) ? node.content : [];
+  for (const child of children) {
+    const found = findImage(child);
+    if (found) return found;
+  }
+  return null;
+}
+
+// Export a doc, re-import it, and hand back the markdown + re-imported image.
+async function roundTrip(source: any): Promise<{ md: string; img: any; back: any }> {
+  const exported = convertProseMirrorToMarkdown(source);
+  const reimported = await markdownToProseMirror(exported);
+  return { md: exported, img: findImage(reimported), back: reimported };
+}
+
+describe('#293 canon #4 — image serialization + attached img-comment', () => {
+  it('a bare image (src only) emits `![]()` with NO comment and round-trips', async () => {
+    const { md, img } = await roundTrip(image({}));
+    expect(md).toBe('![](/i.png)');
+    expect(md).not.toContain('<!--img');
+    expect(img).toBeTruthy();
+    expect(img.attrs.src).toBe('/i.png');
+    // align falls back to the unified "center" default on import.
+    expect(img.attrs.align).toBe('center');
+  });
+
+  it('src + alt emits `![alt](src)` with NO comment and round-trips', async () => {
+    const { md, img } = await roundTrip(image({ alt: 'схема' }));
+    expect(md).toBe('![схема](/i.png)');
+    expect(md).not.toContain('<!--img');
+    expect(img.attrs.alt).toBe('схема');
+  });
+
+  it('alt with markdown-ACTIVE punctuation is escaped and round-trips byte-stable (F1)', async () => {
+    // The alt sits in the `![alt]` label, re-parsed as CommonMark inline on
+    // import; without escaping, a bracket/emphasis in a realistic description
+    // would make the image node VANISH or collapse emphasis. Assert the image
+    // survives with the exact alt AND the markdown is byte-stable on re-export.
+    for (const alt of [
+      'a]b[c', 'Figure [1]', 'the *new* logo', 'x_y_z', 'see ![img', 'a & b',
+      // Canon inline-extension triggers this same package introduces (F5): math
+      // `$`, highlight `==`, footnote `^[` — an unescaped one turns the alt into
+      // a math/highlight/footnote node on import.
+      'x $A$ y', '5$ and 10$', 'use ==bold==', '^[fn]', 'cost $5 == price',
+    ]) {
+      const md1 = convertProseMirrorToMarkdown(image({ alt }));
+      const back = await markdownToProseMirror(md1);
+      const img = findImage(back);
+      expect(img).toBeTruthy(); // image node did NOT vanish
+      expect(img.attrs.alt).toBe(alt); // exact alt preserved
+      expect(convertProseMirrorToMarkdown(back)).toBe(md1); // byte-stable
+    }
+  });
+
+  it('align "center" (the default) emits a bare image, NO comment, round-trips to center', async () => {
+    const { md, img } = await roundTrip(image({ align: 'center' }));
+    expect(md).toBe('![](/i.png)');
+    expect(md).not.toContain('<!--img');
+    expect(img.attrs.align).toBe('center');
+  });
+
+  it('a null align emits a bare image and re-imports as the "center" default', async () => {
+    const { md, img } = await roundTrip(image({ align: null }));
+    expect(md).toBe('![](/i.png)');
+    expect(img.attrs.align).toBe('center');
+  });
+
+  it('align "left" emits an img-comment and round-trips', async () => {
+    const { md, img } = await roundTrip(image({ align: 'left' }));
+    expect(md).toBe('![](/i.png) <!--img {"align":"left"}-->');
+    expect(img.attrs.align).toBe('left');
+  });
+
+  it('align "right" emits an img-comment and round-trips', async () => {
+    const { md, img } = await roundTrip(image({ align: 'right' }));
+    expect(md).toBe('![](/i.png) <!--img {"align":"right"}-->');
+    expect(img.attrs.align).toBe('right');
+  });
+
+  it('width alone emits a single-key comment and round-trips', async () => {
+    const { md, img } = await roundTrip(image({ width: '420' }));
+    expect(md).toBe('![](/i.png) <!--img {"width":"420"}-->');
+    expect(img.attrs.width).toBe('420');
+  });
+
+  it('height alone emits a single-key comment and round-trips', async () => {
+    const { md, img } = await roundTrip(image({ height: '300' }));
+    expect(md).toBe('![](/i.png) <!--img {"height":"300"}-->');
+    expect(img.attrs.height).toBe('300');
+  });
+
+  it('size alone emits a single-key comment and round-trips', async () => {
+    const { md, img } = await roundTrip(image({ size: '48' }));
+    expect(md).toBe('![](/i.png) <!--img {"size":"48"}-->');
+    expect(img.attrs.size).toBe('48');
+  });
+
+  it('aspectRatio alone emits a single-key comment and round-trips', async () => {
+    const { md, img } = await roundTrip(image({ aspectRatio: '1.777' }));
+    expect(md).toBe('![](/i.png) <!--img {"aspectRatio":"1.777"}-->');
+    expect(img.attrs.aspectRatio).toBe('1.777');
+  });
+
+  it('attachmentId (the file link — data-loss critical) rides in the comment and round-trips', async () => {
+    const { md, img } = await roundTrip(image({ attachmentId: 'att-777' }));
+    expect(md).toBe('![](/i.png) <!--img {"attachmentId":"att-777"}-->');
+    expect(img.attrs.attachmentId).toBe('att-777');
+  });
+
+  it('caption rides in the comment and round-trips', async () => {
+    const { md, img } = await roundTrip(image({ caption: 'Рис. 1' }));
+    expect(md).toBe('![](/i.png) <!--img {"caption":"Рис. 1"}-->');
+    expect(img.attrs.caption).toBe('Рис. 1');
+  });
+
+  it('title rides in the comment and round-trips', async () => {
+    const { md, img } = await roundTrip(image({ title: 'a tooltip' }));
+    expect(md).toBe('![](/i.png) <!--img {"title":"a tooltip"}-->');
+    expect(img.attrs.title).toBe('a tooltip');
+  });
+
+  it('multiple attrs at once appear in the stable key order and round-trip', async () => {
+    const { md, img } = await roundTrip(
+      image({
+        alt: 'схема',
+        width: '420',
+        height: '300',
+        align: 'left',
+        size: '48',
+        aspectRatio: '1.5',
+        attachmentId: 'att-1',
+        caption: 'Рис. 1',
+        title: 'tip',
+      }),
+    );
+    // Stable order: width, height, align, size, aspectRatio, attachmentId, caption, title.
+    expect(md).toBe(
+      '![схема](/i.png) <!--img {"width":"420","height":"300","align":"left","size":"48","aspectRatio":"1.5","attachmentId":"att-1","caption":"Рис. 1","title":"tip"}-->',
+    );
+    expect(img.attrs.width).toBe('420');
+    expect(img.attrs.height).toBe('300');
+    expect(img.attrs.align).toBe('left');
+    expect(img.attrs.size).toBe('48');
+    expect(img.attrs.aspectRatio).toBe('1.5');
+    expect(img.attrs.attachmentId).toBe('att-1');
+    expect(img.attrs.caption).toBe('Рис. 1');
+    expect(img.attrs.title).toBe('tip');
+  });
+
+  // MANDATORY (#293 canon #4): a caption containing the comment-closing `-->`
+  // must be encoded so it can never break the HTML comment; JSON.parse restores
+  // it byte-exact on import.
+  it('a caption containing `-->` is escaped, does not break the comment, and round-trips byte-exact', async () => {
+    const caption = 'see --> here';
+    const { md, img } = await roundTrip(image({ caption }));
+    // The `--` pair is defused as the JSON unicode escape, so the literal
+    // caption text is NOT present verbatim and the comment cannot close early.
+    expect(md).toContain('\\u002d\\u002d');
+    expect(md).not.toContain(caption);
+    // The comment closes exactly once: the FIRST `-->` is the final terminator.
+    expect(md.indexOf('-->')).toBe(md.length - '-->'.length);
+    // Restored byte-exact on re-import.
+    expect(img.attrs.caption).toBe(caption);
+  });
+
+  // A whole raw comment-closer as the caption is the adversarial edge.
+  it('a caption that IS `-->` round-trips byte-exact', async () => {
+    const { img } = await roundTrip(image({ caption: '-->' }));
+    expect(img.attrs.caption).toBe('-->');
+  });
+
+  it('an image INSIDE a column keeps the raw <img> form (no img-comment) and round-trips', async () => {
+    const source = doc({
+      type: 'columns',
+      attrs: { layout: 'two' },
+      content: [
+        {
+          type: 'column',
+          content: [
+            {
+              type: 'image',
+              attrs: { src: '/i.png', alt: 'c', width: '320', align: 'left', attachmentId: 'att-9' },
+            },
+          ],
+        },
+        { type: 'column', content: [{ type: 'paragraph', content: [{ type: 'text', text: 'r' }] }] },
+      ],
+    });
+    const md = convertProseMirrorToMarkdown(source);
+    expect(md).toContain('<img');
+    expect(md).not.toContain('<!--img');
+    const back = await markdownToProseMirror(md);
+    const img = findImage(back);
+    expect(img).toBeTruthy();
+    expect(img.attrs.width).toBe('320');
+    expect(img.attrs.align).toBe('left');
+    expect(img.attrs.attachmentId).toBe('att-9');
+  });
+
+  // ---- Fail-open behavior ---------------------------------------------------
+
+  it('malformed JSON in an img-comment is ignored; the image keeps default attrs (no crash)', async () => {
+    const back = await markdownToProseMirror('![](/i.png) <!--img {bad-->');
+    const img = findImage(back);
+    expect(img).toBeTruthy();
+    expect(img.attrs.width).toBeNull();
+    expect(img.attrs.align).toBe('center'); // default
+  });
+
+  it('a STANDALONE img-comment (no adjacent <img>) is inert — no image materialized', async () => {
+    const back = await markdownToProseMirror('<!--img {"width":10}-->');
+    expect(findImage(back)).toBeNull();
+  });
+
+  it('unknown keys in a valid img-comment are ignored; the image is otherwise default', async () => {
+    const back = await markdownToProseMirror('![](/i.png) <!--img {"zzz":1}-->');
+    const img = findImage(back);
+    expect(img).toBeTruthy();
+    expect(img.attrs.width).toBeNull();
+    expect(img.attrs.align).toBe('center');
+    expect((img.attrs as any).zzz).toBeUndefined();
+  });
+
+  it('NUMERIC sizing attrs serialize as strings and round-trip byte-stably', async () => {
+    // The import side reads DOM attributes back as strings, so a numeric source
+    // value must be stringified in the payload or the first round-trip churns
+    // `420 -> "420"` (a spurious one-time git diff). Assert the emitted string
+    // form AND that a second export is byte-identical to the first.
+    const d = image({ width: 420, height: 200, size: 80, aspectRatio: 1.5 });
+    const md1 = convertProseMirrorToMarkdown(d);
+    expect(md1).toBe(
+      '![](/i.png) <!--img {"width":"420","height":"200","size":"80","aspectRatio":"1.5"}-->',
+    );
+    // Re-import and export again, awaiting like the sibling round-trip tests.
+    const back = await markdownToProseMirror(md1);
+    const md2 = convertProseMirrorToMarkdown(back);
+    expect(md2).toBe(md1); // byte-stable: no 420 -> "420" churn
+  });
+});
diff --git a/packages/prosemirror-markdown/test/machinery-comments.test.ts b/packages/prosemirror-markdown/test/machinery-comments.test.ts
new file mode 100644
index 00000000..f8674091
--- /dev/null
+++ b/packages/prosemirror-markdown/test/machinery-comments.test.ts
@@ -0,0 +1,194 @@
+import { describe, expect, it } from 'vitest';
+// Import DIRECTLY from src (NOT the docmost-client barrel, which pulls in
+// collaboration.ts and mutates the global DOM at import time), matching the
+// other converter unit tests.
+import { convertProseMirrorToMarkdown } from '../src/lib/markdown-converter.js';
+import { markdownToProseMirror } from '../src/lib/markdown-to-prosemirror.js';
+import { standaloneCommentFor } from '../src/lib/attached-comment.js';
+
+// #293 canon decision #5: `subpages` and `pageBreak` serialize as STANDALONE
+// HTML comments on their own line —
+//   <!--subpages-->            <!--subpages {"recursive":true}-->   <!--pagebreak-->
+// — invisible in any markdown renderer, yet round-tripping (the importer
+// materializes them back into the block atom before generateJSON drops the
+// comment). Position determines legality: they are honored ONLY standalone; a
+// comment attached after visible text is INERT. Inside a raw-HTML container
+// (columns/cells) the DOM parse stage discards comment nodes, so there the
+// schema `<div data-type="...">` form is emitted instead. These tests assert the
+// EXACT emitted markdown and a lossless round trip (non-vacuous).
+
+const doc = (...nodes: any[]) => ({ type: 'doc', content: nodes });
+const text = (t: string) => ({ type: 'text', text: t });
+const para = (...inline: any[]) => ({ type: 'paragraph', content: inline });
+
+// Recursively collect every node type present in a doc.
+const collectTypes = (n: any, set = new Set<string>()): Set<string> => {
+  if (!n || typeof n !== 'object') return set;
+  if (n.type) set.add(n.type);
+  // Recurse with the SAME accumulator so one Set gathers the whole subtree.
+  for (const c of Array.isArray(n.content) ? n.content : []) collectTypes(c, set);
+  return set;
+};
+
+// Find the first node of the given `type` anywhere in a doc (depth-first, in
+// document order) so tests can assert on its attrs or subtree; returns
+// undefined when no such node exists.
+const findNode = (n: any, type: string): any => {
+  if (!n || typeof n !== 'object') return undefined;
+  if (n.type === type) return n;
+  for (const child of Array.isArray(n.content) ? n.content : []) {
+    const match = findNode(child, type);
+    if (match) return match;
+  }
+  return undefined;
+};
+
+describe('standaloneCommentFor primitive (#293 #5)', () => {
+  it('emits a name-only comment when there are no attrs', () => {
+    expect(standaloneCommentFor('pagebreak')).toBe('<!--pagebreak-->');
+    expect(standaloneCommentFor('subpages')).toBe('<!--subpages-->');
+    expect(standaloneCommentFor('subpages', {})).toBe('<!--subpages-->');
+    expect(standaloneCommentFor('subpages', null)).toBe('<!--subpages-->');
+  });
+
+  it('emits a compact JSON body when attrs are present', () => {
+    expect(standaloneCommentFor('subpages', { recursive: true })).toBe(
+      '<!--subpages {"recursive":true}-->',
+    );
+  });
+
+  it('shares the attached encoder `--` escaping (payload cannot close early)', () => {
+    const s = standaloneCommentFor('subpages', { note: 'a--b' });
+    expect(s).toBe('<!--subpages {"note":"a\\u002d\\u002db"}-->');
+    // No premature `--` inside the payload -> the comment cannot terminate early.
+    expect(s.slice('<!--'.length, -'-->'.length)).not.toContain('--');
+  });
+});
+
+describe('subpages standalone serialization (#293 #5)', () => {
+  it('default subpages -> exactly <!--subpages-->', () => {
+    expect(convertProseMirrorToMarkdown(doc({ type: 'subpages' }))).toBe('<!--subpages-->');
+  });
+
+  it('markdown <!--subpages--> -> a subpages node, byte-stable re-export', async () => {
+    const md = '<!--subpages-->';
+    const doc2 = await markdownToProseMirror(md);
+    expect(collectTypes(doc2).has('subpages')).toBe(true);
+    expect(convertProseMirrorToMarkdown(doc2)).toBe(md);
+  });
+
+  it('recursive subpages -> <!--subpages {"recursive":true}--> and round-trips recursive:true', async () => {
+    const md = convertProseMirrorToMarkdown(
+      doc({ type: 'subpages', attrs: { recursive: true } }),
+    );
+    expect(md).toBe('<!--subpages {"recursive":true}-->');
+    const doc2 = await markdownToProseMirror(md);
+    const node = findNode(doc2, 'subpages');
+    expect(node).toBeTruthy();
+    expect(node.attrs.recursive).toBe(true);
+    // Byte-stable second export closes the loop.
+    expect(convertProseMirrorToMarkdown(doc2)).toBe(md);
+  });
+});
+
+describe('pageBreak standalone serialization (#293 #5)', () => {
+  it('pageBreak -> exactly <!--pagebreak-->', () => {
+    expect(convertProseMirrorToMarkdown(doc({ type: 'pageBreak' }))).toBe('<!--pagebreak-->');
+  });
+
+  it('markdown <!--pagebreak--> round-trips to a pageBreak node, byte-stable', async () => {
+    const md = '<!--pagebreak-->';
+    const doc2 = await markdownToProseMirror(md);
+    expect(collectTypes(doc2).has('pageBreak')).toBe(true);
+    expect(convertProseMirrorToMarkdown(doc2)).toBe(md);
+  });
+});
+
+describe('subpages inside a column uses the div-form, not a comment (#293 #5)', () => {
+  // A column is a raw-HTML block: the DOM parse stage discards comment nodes, so
+  // a comment inside it would silently vanish. The converter MUST emit the
+  // schema div-form there instead.
+  const columnsDoc = doc({
+    type: 'columns',
+    content: [
+      { type: 'column', attrs: { width: '50%' }, content: [{ type: 'subpages' }] },
+      { type: 'column', attrs: { width: '50%' }, content: [para(text('side'))] },
+    ],
+  });
+
+  it('serializes the column subpages as <div data-type="subpages">, not <!--subpages-->', () => {
+    const md = convertProseMirrorToMarkdown(columnsDoc);
+    expect(md).toContain('data-type="subpages"');
+    // The bare standalone comment must NOT appear inside the raw-HTML column.
+    expect(md).not.toContain('<!--subpages-->');
+  });
+
+  it('round-trips back to a subpages node still inside a column', async () => {
+    const md = convertProseMirrorToMarkdown(columnsDoc);
+    const doc2 = await markdownToProseMirror(md);
+    const column = findNode(doc2, 'column');
+    expect(column).toBeTruthy();
+    expect(collectTypes(column).has('subpages')).toBe(true);
+  });
+});
+
+describe('position legality / fail-open (#293 #5)', () => {
+  it('an ATTACHED <!--subpages--> after paragraph text is INERT (no subpages node)', async () => {
+    const doc2 = await markdownToProseMirror('para text <!--subpages-->');
+    expect(collectTypes(doc2).has('subpages')).toBe(false);
+    // The paragraph text survives, and no comment marker leaks into the body.
+    expect(JSON.stringify(doc2)).not.toContain('<!--');
+  });
+
+  it('a malformed <!--subpages {bad--> is INERT (no crash, no subpages node)', async () => {
+    const doc2 = await markdownToProseMirror('<!--subpages {bad-->');
+    expect(collectTypes(doc2).has('subpages')).toBe(false);
+  });
+});
+
+describe('multi-node document order across standalone comments (#293 #5)', () => {
+  // The riskiest part of the parser change: a LEADING standalone comment is
+  // parsed at document level (outside <body>) and must be re-inserted into the
+  // body in document order, interleaved correctly with real block content. A
+  // MID-document comment (pageBreak here) exercises the in-body branch. This
+  // locks the ordering the review flagged as covered only by manual checks.
+  const topTypes = (d: any) => (d.content || []).map((n: any) => n.type);
+
+  it('leading + mid + trailing standalone comments keep document order', async () => {
+    const d = doc(
+      { type: 'subpages' }, // leading -> parsed at document level
+      para(text('a')),
+      { type: 'pageBreak' }, // mid -> parsed in-body
+      para(text('b')),
+    );
+    const md = convertProseMirrorToMarkdown(d);
+    expect(md).toBe('<!--subpages-->\n\na\n\n<!--pagebreak-->\n\nb');
+    const d2 = await markdownToProseMirror(md);
+    // Order must be preserved exactly, not just membership.
+    expect(topTypes(d2)).toEqual([
+      'subpages',
+      'paragraph',
+      'pageBreak',
+      'paragraph',
+    ]);
+    // And byte-stable on re-export.
+    expect(convertProseMirrorToMarkdown(d2)).toBe(md);
+  });
+
+  it('two leading standalone comments keep their relative order', async () => {
+    const d = doc({ type: 'subpages' }, { type: 'pageBreak' }, para(text('x')));
+    const md = convertProseMirrorToMarkdown(d);
+    expect(md).toBe('<!--subpages-->\n\n<!--pagebreak-->\n\nx');
+    const d2 = await markdownToProseMirror(md);
+    expect(topTypes(d2)).toEqual(['subpages', 'pageBreak', 'paragraph']);
+    expect(convertProseMirrorToMarkdown(d2)).toBe(md);
+  });
+
+  it('a trailing standalone comment stays last', async () => {
+    const d = doc(para(text('x')), { type: 'subpages' });
+    const md = convertProseMirrorToMarkdown(d);
+    expect(md).toBe('x\n\n<!--subpages-->');
+    const d2 = await markdownToProseMirror(md);
+    expect(topTypes(d2)).toEqual(['paragraph', 'subpages']);
+    expect(convertProseMirrorToMarkdown(d2)).toBe(md);
+  });
+});
diff --git a/packages/git-sync/test/markdown-converter-gaps.test.ts b/packages/prosemirror-markdown/test/markdown-converter-gaps.test.ts
similarity index 92%
rename from packages/git-sync/test/markdown-converter-gaps.test.ts
rename to packages/prosemirror-markdown/test/markdown-converter-gaps.test.ts
index 47ab05bc..4aae6b3b 100644
--- a/packages/git-sync/test/markdown-converter-gaps.test.ts
+++ b/packages/prosemirror-markdown/test/markdown-converter-gaps.test.ts
@@ -36,29 +36,30 @@ async function roundTrip(node: any): Promise<{ md1: string; doc2: any; md2: stri
 // existing documented `it.fails` bugs in markdown-roundtrip.property.test.ts).
 // ---------------------------------------------------------------------------
 describe('pageBreak data loss (no converter case — SPEC §11 divergence)', () => {
-  it('exports a pageBreak node to the schema-matching block div', () => {
-    // FIXED: a standalone pageBreak now emits the block-level HTML div so the
-    // node survives instead of being erased to "".
+  it('exports a pageBreak node to the standalone comment (#293 #5)', () => {
+    // #293 canon #5: a standalone pageBreak now serializes as the readable,
+    // renderer-invisible comment `<!--pagebreak-->` (re-materialized on import),
+    // instead of the earlier raw <div> block.
     expect(convertProseMirrorToMarkdown(doc({ type: 'pageBreak' }))).toBe(
-      '<div data-type="pageBreak"></div>',
+      '<!--pagebreak-->',
     );
   });
 
   it('keeps a pageBreak sitting BETWEEN two paragraphs on export', () => {
-    // FIXED: with surrounding content the divider is emitted as its own block
+    // With surrounding content the divider is emitted as its own comment line
     // between the two paragraphs (joined by the doc "\n\n"), no longer dropped.
     const out = convertProseMirrorToMarkdown(
       doc(para(text('before')), { type: 'pageBreak' }, para(text('after'))),
     );
     expect(out).toBe(
-      'before\n\n<div data-type="pageBreak"></div>\n\nafter',
+      'before\n\n<!--pagebreak-->\n\nafter',
     );
-    expect(out).toContain('pageBreak');
+    expect(out).toContain('<!--pagebreak-->');
   });
 
   // FIXED: a pageBreak node now survives an export -> import -> export cycle
-  // because the FIRST export emits the schema-matching block div, which marked
-  // passes through and generateJSON rebuilds into a pageBreak node again.
+  // because the FIRST export emits the standalone comment, which the importer
+  // materializes back into a pageBreak node again.
   it('a pageBreak node round-trips (export -> import yields a pageBreak)', async () => {
     const { md1, doc2 } = await roundTrip({ type: 'pageBreak' });
     expect(md1).not.toBe('');
@@ -68,18 +69,18 @@ describe('pageBreak data loss (no converter case — SPEC §11 divergence)', ()
 });
 
 // ---------------------------------------------------------------------------
-// 2. subpages round-trip (`case "subpages"` emits the schema-matching div).
+// 2. subpages round-trip (#293 #5 standalone comment).
 //
 // It used to emit the literal `{{SUBPAGES}}`, which has no markdown/HTML meaning,
 // so on re-import the subpages BLOCK came back as a plain PARAGRAPH carrying the
 // literal string (the embed rendered as visible "{{SUBPAGES}}" text on the page
-// after a sync — data loss). It now emits `<div data-type="subpages">` like the
-// other embed nodes, so the schema's parseHTML rebuilds the subpages node.
+// after a sync — data loss). Per canon #5 it now emits the standalone comment
+// `<!--subpages-->`, which the importer materializes back into a subpages node.
 // ---------------------------------------------------------------------------
-describe('subpages round-trip (schema-matching div)', () => {
-  it('emits the subpages div and re-imports as a subpages node (no literal leak)', async () => {
+describe('subpages round-trip (standalone comment #293 #5)', () => {
+  it('emits the subpages comment and re-imports as a subpages node (no literal leak)', async () => {
     const { md1, doc2 } = await roundTrip({ type: 'subpages' });
-    expect(md1).toBe('<div data-type="subpages"></div>');
+    expect(md1).toBe('<!--subpages-->');
 
     const collect = (n: any): string[] => [
       n.type,
@@ -477,22 +478,24 @@ describe('converter gap coverage — documented round-trip data loss (specs 12
     expect(docsCanonicallyEqual(d, doc2)).toBe(false);
   });
 
-  // 14. The image emitter drops the title attribute (silently lost on round-trip).
-  it('an image title attribute is dropped on export and lost on re-import', async () => {
+  // 14. #293 canon #4: the image title now round-trips via the attached
+  //     `<!--img {…}-->` comment (previously silently dropped).
+  it('an image title attribute round-trips via the attached img-comment', async () => {
     const d = doc({
       type: 'image',
       attrs: { src: '/i.png', alt: 'a', title: 't"q' },
     });
     const md1 = convertProseMirrorToMarkdown(d);
-    expect(md1).toBe('![a](/i.png)'); // no title, no quotes
+    // The quote in the title is JSON-escaped inside the comment payload.
+    expect(md1).toBe('![a](/i.png) <!--img {"title":"t\\"q"}-->');
 
     const doc2 = await markdownToProseMirror(md1);
     const img = (doc2.content || []).find((n: any) => n.type === 'image');
     expect(img).toBeTruthy();
-    expect(img.attrs?.title).toBeNull(); // the original 't"q' was dropped
+    expect(img.attrs?.title).toBe('t"q'); // restored byte-exact
     expect(img.attrs?.src).toBe('/i.png');
     expect(img.attrs?.alt).toBe('a');
-    expect(docsCanonicallyEqual(d, doc2)).toBe(false);
+    expect(docsCanonicallyEqual(d, doc2)).toBe(true);
   });
 });
 
@@ -506,8 +509,10 @@ describe('converter gap coverage — raw-HTML container round-trips (specs 15–
         attrs: { src: '/i.png', alt: 'cap', width: 320, align: 'center' },
       }),
     );
+    // #293 canon #4: image align default is unified to "center", so a center
+    // image inside a column no longer emits a redundant align="center".
     expect(md1).toBe(
-      '<div data-type="columns" data-layout="two"><div data-type="column"><img src="/i.png" alt="cap" width="320" align="center"></div></div>',
+      '<div data-type="columns" data-layout="two"><div data-type="column"><img src="/i.png" alt="cap" width="320"></div></div>',
     );
     expect(md2).toBe(md1);
     expect(colChildOf(doc2)?.type).toBe('image');
@@ -786,11 +791,11 @@ describe('converter gap coverage — raw-HTML container round-trips (specs 15–
 });
 
 // ===========================================================================
-// 30. heading.textAlign round-trip (A1). The paragraph case already exports a
-// non-default alignment as a styled `<p style="text-align:…">` that re-parses
-// losslessly; headings used to emit only the bare `## text` form, silently
-// DROPPING textAlign on export. The heading case is now symmetric: an aligned
-// heading exports as `<hN style="text-align:…">` and re-parses back to a heading
+// 30. heading.textAlign round-trip (A1). Bare `## text` markdown carries no
+// alignment, so an aligned heading used to silently DROP textAlign on export.
+// Per #293 canon #9 an aligned heading now keeps the readable `## text` form and
+// ATTACHES a trailing `<!--attrs {"textAlign":…}-->` comment (replacing the old
+// `<hN style="text-align:…">` HTML form). It re-parses back to a heading
 // carrying BOTH the level and the textAlign, so the round-trip is lossless; an
 // UNaligned heading still emits the bare `## text` markdown form (no churn).
 // ===========================================================================
@@ -801,21 +806,22 @@ const alignedHeading = (level: number, align: string, ...inline: any[]) => ({
 });
 
 describe('heading.textAlign round-trip (A1)', () => {
-  it('an aligned heading exports as <hN style="text-align:…"> (not bare ##)', () => {
+  it('an aligned heading keeps "## text" and attaches a <!--attrs--> comment (#293 #9)', () => {
     expect(convertProseMirrorToMarkdown(doc(alignedHeading(2, 'center', text('Title'))))).toBe(
-      '<h2 style="text-align:center">Title</h2>',
+      '## Title <!--attrs {"textAlign":"center"}-->',
     );
   });
 
   it('survives export -> import -> export losslessly (level AND textAlign preserved)', async () => {
     const input = alignedHeading(2, 'center', text('Title'));
     const { md1, doc2, md2 } = await roundTrip(input);
-    // Export direction: a styled <hN>, injection-safe via escapeAttr.
-    expect(md1).toBe('<h2 style="text-align:center">Title</h2>');
+    // Export direction: `## Title` plus the attached alignment comment (#293 #9).
+    expect(md1).toBe('## Title <!--attrs {"textAlign":"center"}-->');
     // Import direction: re-parses to a heading node with the level AND textAlign
-    // (the raw <hN style> HTML block flows through marked -> generateJSON, where
-    // the heading parse rule matches and the textAlign global attr reads the
-    // style back). Byte-stable second export closes the loop.
+    // (marked keeps the comment inside the <h2>; applyAttachedComments re-expresses
+    // it as an inline style before generateJSON, where the heading parse rule
+    // matches and the textAlign global attr reads it back). Byte-stable second
+    // export closes the loop.
     const h = doc2.content[0];
     expect(h.type).toBe('heading');
     expect(h.attrs.level).toBe(2);
diff --git a/packages/git-sync/test/markdown-converter-golden.test.ts b/packages/prosemirror-markdown/test/markdown-converter-golden.test.ts
similarity index 69%
rename from packages/git-sync/test/markdown-converter-golden.test.ts
rename to packages/prosemirror-markdown/test/markdown-converter-golden.test.ts
index f8ba6b76..86a00e25 100644
--- a/packages/git-sync/test/markdown-converter-golden.test.ts
+++ b/packages/prosemirror-markdown/test/markdown-converter-golden.test.ts
@@ -51,43 +51,49 @@ describe('columns / column (raw-HTML layout wrapper)', () => {
   });
 });
 
-describe('embed / audio / pdf (previously emitted nothing — invisible regression)', () => {
-  it('embed emits div[data-type="embed"] with src/provider', () => {
+describe('embed / audio / pdf top-level md-form + discriminator (#293 #8)', () => {
+  it('embed emits link-form [provider](src) + bare discriminator (defaults omitted)', () => {
+    // provider is the visible link text; align/width/height are all at their
+    // schema defaults (center/800/600), so the comment is name-only.
     expect(c({ type: 'embed', attrs: { src: 'https://x.com/e', provider: 'iframe' } })).toBe(
-      '<div data-type="embed" data-src="https://x.com/e" data-provider="iframe"></div>',
+      '[iframe](https://x.com/e)<!--embed-->',
     );
   });
 
-  it('audio emits a div-wrapped <audio> with src', () => {
-    expect(c({ type: 'audio', attrs: { src: '/a.mp3' } })).toBe(
-      '<div><audio src="/a.mp3"></audio></div>',
-    );
+  it('audio emits image-form ![](src) + bare discriminator', () => {
+    expect(c({ type: 'audio', attrs: { src: '/a.mp3' } })).toBe('![](/a.mp3)<!--audio-->');
   });
 
-  it('pdf emits div[data-type="pdf"] with src and name', () => {
+  it('pdf emits link-form [name](src) + bare discriminator', () => {
     expect(c({ type: 'pdf', attrs: { src: '/d.pdf', name: 'd.pdf' } })).toBe(
-      '<div data-type="pdf" src="/d.pdf" data-name="d.pdf"></div>',
+      '[d.pdf](/d.pdf)<!--pdf-->',
     );
   });
 });
 
-describe('drawio / excalidraw data-align asymmetry (SPEC §11)', () => {
-  it('drawio: data-align is ABSENT when align is unset', () => {
+describe('drawio / excalidraw align emission in the discriminator comment (#293 #8)', () => {
+  it('drawio: NO align key when align is unset (bare discriminator)', () => {
     const out = c({ type: 'drawio', attrs: { src: '/d.drawio' } });
-    expect(out).toBe('<div data-type="drawio" data-src="/d.drawio"></div>');
-    expect(out).not.toContain('data-align');
+    expect(out).toBe('![](/d.drawio)<!--drawio-->');
+    expect(out).not.toContain('align');
   });
 
-  it('drawio: data-align is PRESENT for a non-default align', () => {
+  it('drawio: an "align" key IS present for a non-default align', () => {
     expect(c({ type: 'drawio', attrs: { src: '/d.drawio', align: 'right' } })).toBe(
-      '<div data-type="drawio" data-src="/d.drawio" data-align="right"></div>',
+      '![](/d.drawio)<!--drawio {"align":"right"}-->',
     );
   });
 
-  it('excalidraw: data-align is ABSENT when align is unset', () => {
+  it('drawio: the default align "center" is OMITTED (byte-stable image-form parity)', () => {
+    const out = c({ type: 'drawio', attrs: { src: '/d.drawio', align: 'center' } });
+    expect(out).toBe('![](/d.drawio)<!--drawio-->');
+    expect(out).not.toContain('align');
+  });
+
+  it('excalidraw: NO align key when align is unset (bare discriminator)', () => {
     const out = c({ type: 'excalidraw', attrs: { src: '/e.excalidraw' } });
-    expect(out).toBe('<div data-type="excalidraw" data-src="/e.excalidraw"></div>');
-    expect(out).not.toContain('data-align');
+    expect(out).toBe('![](/e.excalidraw)<!--excalidraw-->');
+    expect(out).not.toContain('align');
   });
 });
 
@@ -97,7 +103,9 @@ describe('inline-mark matrix (underline/sub/sup/highlight±color/textStyle/comme
       [[{ type: 'underline' }], '<u>m</u>'],
       [[{ type: 'subscript' }], '<sub>m</sub>'],
       [[{ type: 'superscript' }], '<sup>m</sup>'],
-      [[{ type: 'highlight' }], '<mark>m</mark>'],
+      // #293 canon #7: a no-color highlight now serializes as `==m==` (Obsidian
+      // syntax); only a COLORED highlight keeps the `<mark style=…>` HTML form.
+      [[{ type: 'highlight' }], '==m=='],
       [
         [{ type: 'highlight', attrs: { color: '#ff0000' } }],
         '<mark style="background-color: #ff0000">m</mark>',
@@ -129,27 +137,26 @@ describe('inline-mark matrix (underline/sub/sup/highlight±color/textStyle/comme
   });
 });
 
-describe('paragraph.textAlign -> <p style="text-align:...">', () => {
-  it('non-default alignment emits an HTML <p style="text-align:...">', () => {
-    // #7 fix: a non-default paragraph alignment now round-trips. It is exported
-    // as an HTML `<p style="text-align:center">` (the schema's paragraph
-    // parseHTML reads `style="text-align"` back onto `textAlign` on import), so
-    // the alignment survives instead of collapsing to bare text. (The old
-    // `<div align="center">` form was NOT re-parsed onto the paragraph and was
-    // therefore lossy.)
+describe('paragraph.textAlign -> attached <!--attrs--> comment (#293 #9)', () => {
+  it('non-default alignment emits a trailing <!--attrs {"textAlign":…}--> comment', () => {
+    // #293 canon #9: a non-default paragraph alignment now round-trips as an
+    // ATTACHED HTML comment at the END of the block line instead of the old
+    // `<p style="text-align:center">` wrapper (which the maintainer had to patch
+    // A14->A15->A16). The importer's applyAttachedComments step reads the comment
+    // back onto `textAlign` before the DOM stage drops it.
     expect(c({ type: 'paragraph', attrs: { textAlign: 'center' }, content: [text('x')] })).toBe(
-      '<p style="text-align:center">x</p>',
+      'x <!--attrs {"textAlign":"center"}-->',
     );
   });
 
-  it('textAlign "left" (the default) is NOT wrapped', () => {
+  it('textAlign "left" (the default) emits NO comment', () => {
     expect(c({ type: 'paragraph', attrs: { textAlign: 'left' }, content: [text('x')] })).toBe('x');
   });
 });
 
 describe('subpages token + unknown-in-container fallback', () => {
-  it('subpages emits the schema-matching div (round-trips, unlike the old {{SUBPAGES}} literal)', () => {
-    expect(c({ type: 'subpages' })).toBe('<div data-type="subpages"></div>');
+  it('subpages emits the standalone comment (#293 #5, unlike the old {{SUBPAGES}} literal)', () => {
+    expect(c({ type: 'subpages' })).toBe('<!--subpages-->');
   });
 
   it('an unknown block inside a raw-HTML container is wrapped in <div> (never markdown)', () => {
@@ -177,13 +184,20 @@ describe('subpages token + unknown-in-container fallback', () => {
 
 describe('escaping idempotence (SPEC §11 phantom-diff guard)', () => {
   it('escapeAttr escapes ONLY & and " in an attribute context, and is idempotent', () => {
-    // The mathBlock `text` attr goes through escapeAttr. & -> &amp;, " -> &quot;.
-    const once = c({ type: 'mathBlock', attrs: { text: 'a & "b"' } });
-    expect(once).toBe(
+    // #293 canon #6: a TOP-LEVEL mathBlock now serializes as a `$$` fence, so
+    // to exercise the schema-HTML `text` attr (which DOES go through escapeAttr)
+    // we wrap the math in a COLUMN — the raw-HTML path keeps the `<div>` form.
+    const col = (child: any) => ({
+      type: 'columns',
+      content: [{ type: 'column', content: [child] }],
+    });
+    // & -> &amp;, " -> &quot; in the attribute context.
+    const once = c(col({ type: 'mathBlock', attrs: { text: 'a & "b"' } }));
+    expect(once).toContain(
       '<div data-type="mathBlock" data-katex="true" text="a &amp; &quot;b&quot;"></div>',
     );
     // < and > are deliberately NOT escaped (would accumulate on round-trips).
-    const angled = c({ type: 'mathBlock', attrs: { text: 'a < b > c' } });
+    const angled = c(col({ type: 'mathBlock', attrs: { text: 'a < b > c' } }));
     expect(angled).toContain('text="a < b > c"');
     expect(angled).not.toContain('&lt;');
     expect(angled).not.toContain('&gt;');
@@ -248,7 +262,10 @@ describe('empty / single-column tables', () => {
 // orderedList and a hardBreak inside a column.
 // ---------------------------------------------------------------------------
 describe('media / attachment / container full-attribute golden coverage', () => {
-  it('video: emits all optional attrs in source order (alt->aria-label, attachmentId/size/align/aspectRatio->data-*)', () => {
+  it('video: emits all optional attrs in the comment JSON in stable order (align center omitted)', () => {
+    // #293 canon #8 image-form: src in the target, all OTHER non-default attrs in
+    // the comment JSON (stable order alt/attachmentId/width/height/size/
+    // aspectRatio; align="center" is the default and is omitted).
     expect(
       c({
         type: 'video',
@@ -264,50 +281,49 @@ describe('media / attachment / container full-attribute golden coverage', () =>
         },
       }),
     ).toBe(
-      '<div><video src="/v.mp4" aria-label="clip" data-attachment-id="att-1" width="640" height="480" data-size="1234" data-align="center" data-aspect-ratio="1.777"></video></div>',
+      '![](/v.mp4)<!--video {"alt":"clip","attachmentId":"att-1","width":"640","height":"480","size":"1234","aspectRatio":"1.777"}-->',
     );
   });
 
-  it('video: with only src, every optional guard takes its false branch (src-only <video>, no data-type on wrapper)', () => {
-    expect(c({ type: 'video', attrs: { src: '/v.mp4' } })).toBe(
-      '<div><video src="/v.mp4"></video></div>',
-    );
+  it('video: with only src, the discriminator is still emitted name-only (bare ![](src)<!--video-->)', () => {
+    expect(c({ type: 'video', attrs: { src: '/v.mp4' } })).toBe('![](/v.mp4)<!--video-->');
   });
 
-  it('youtube + embed: each emits its full optional attr set in source order', () => {
-    // (a) youtube: width/height/align all present -> data-* in order.
+  it('youtube + embed: each emits its full optional attr set in the discriminator comment', () => {
+    // (a) youtube (image-form): width/height/align(right) in the comment JSON.
     expect(
       c({
         type: 'youtube',
         attrs: { src: 'https://youtu.be/abc', width: 560, height: 315, align: 'right' },
       }),
     ).toBe(
-      '<div data-type="youtube" data-src="https://youtu.be/abc" data-width="560" data-height="315" data-align="right"></div>',
+      '![](https://youtu.be/abc)<!--youtube {"width":"560","height":"315","align":"right"}-->',
     );
-    // (b) embed: align/width/height optional branches after src+provider.
+    // (b) embed (link-form): provider is the visible text; a non-default align/
+    // width/height (left/600/400 — the defaults are center/800/600) ride in JSON.
     expect(
       c({
         type: 'embed',
         attrs: { src: 'https://x.com/e', provider: 'iframe', align: 'left', width: 600, height: 400 },
       }),
     ).toBe(
-      '<div data-type="embed" data-src="https://x.com/e" data-provider="iframe" data-align="left" data-width="600" data-height="400"></div>',
+      '[iframe](https://x.com/e)<!--embed {"align":"left","width":"600","height":"400"}-->',
     );
   });
 
-  it('audio: emits data-attachment-id then data-size after src when both are set', () => {
+  it('audio: emits attachmentId then size in the comment JSON when both are set', () => {
     expect(c({ type: 'audio', attrs: { src: '/a.mp3', attachmentId: 'att-7', size: 9001 } })).toBe(
-      '<div><audio src="/a.mp3" data-attachment-id="att-7" data-size="9001"></audio></div>',
+      '![](/a.mp3)<!--audio {"attachmentId":"att-7","size":"9001"}-->',
     );
   });
 
-  it('audio: with attachmentId but no size, data-size is suppressed (size != null false branch)', () => {
+  it('audio: with attachmentId but no size, the size key is suppressed (size != null false branch)', () => {
     expect(c({ type: 'audio', attrs: { src: '/a.mp3', attachmentId: 'att-7' } })).toBe(
-      '<div><audio src="/a.mp3" data-attachment-id="att-7"></audio></div>',
+      '![](/a.mp3)<!--audio {"attachmentId":"att-7"}-->',
     );
   });
 
-  it('pdf: emits the full optional attr set in order (data-name, data-attachment-id, data-size, width, height)', () => {
+  it('pdf: emits the full optional attr set in the comment JSON (attachmentId, size, width, height)', () => {
     expect(
       c({
         type: 'pdf',
@@ -321,11 +337,11 @@ describe('media / attachment / container full-attribute golden coverage', () =>
         },
       }),
     ).toBe(
-      '<div data-type="pdf" src="/d.pdf" data-name="d.pdf" data-attachment-id="att-9" data-size="2048" width="800" height="600"></div>',
+      '[d.pdf](/d.pdf)<!--pdf {"attachmentId":"att-9","size":"2048","width":"800","height":"600"}-->',
     );
   });
 
-  it('attachment: emits data-attachment-name/mime/size/id in order after the always-present url', () => {
+  it('attachment: emits mime/size/attachmentId in the comment JSON after the [name](url) target', () => {
     expect(
       c({
         type: 'attachment',
@@ -338,13 +354,14 @@ describe('media / attachment / container full-attribute golden coverage', () =>
         },
       }),
     ).toBe(
-      '<div data-type="attachment" data-attachment-url="/f.zip" data-attachment-name="f.zip" data-attachment-mime="application/zip" data-attachment-size="512" data-attachment-id="att-3"></div>',
+      '[f.zip](/f.zip)<!--attachment {"mime":"application/zip","size":"512","attachmentId":"att-3"}-->',
     );
   });
 
-  it('attachment: with only a url, no spurious data-attachment-name/mime/size/id appear (all guards false)', () => {
+  it('attachment: with only a url, the link text is empty and the discriminator is name-only', () => {
+    // name is null -> empty visible text `[]`; no mime/size/id -> bare comment.
     expect(c({ type: 'attachment', attrs: { url: '/f.zip' } })).toBe(
-      '<div data-type="attachment" data-attachment-url="/f.zip"></div>',
+      '[](/f.zip)<!--attachment-->',
     );
   });
 
diff --git a/packages/git-sync/test/markdown-converter-html-marks.test.ts b/packages/prosemirror-markdown/test/markdown-converter-html-marks.test.ts
similarity index 100%
rename from packages/git-sync/test/markdown-converter-html-marks.test.ts
rename to packages/prosemirror-markdown/test/markdown-converter-html-marks.test.ts
diff --git a/packages/git-sync/test/markdown-converter.test.ts b/packages/prosemirror-markdown/test/markdown-converter.test.ts
similarity index 94%
rename from packages/git-sync/test/markdown-converter.test.ts
rename to packages/prosemirror-markdown/test/markdown-converter.test.ts
index 98cb88c0..2a39de6c 100644
--- a/packages/git-sync/test/markdown-converter.test.ts
+++ b/packages/prosemirror-markdown/test/markdown-converter.test.ts
@@ -390,27 +390,26 @@ describe('convertProseMirrorToMarkdown', () => {
 
   // ---------------------------------------------------------------------------
   describe('math', () => {
-    it('inline math carries LaTeX in a text attr WITHOUT escaping < or >', () => {
+    it('inline math serializes as $LaTeX$ (Obsidian-native), no HTML escaping', () => {
       const out = convertProseMirrorToMarkdown(
         doc(para({ type: 'mathInline', attrs: { text: 'a < b' } })),
       );
-      // < and > must NOT be HTML-escaped (idempotency); only & and " would be.
-      expect(out).toBe(
-        '<span data-type="mathInline" data-katex="true" text="a < b"></span>',
-      );
+      // #293 canon #6: readable `$…$` form; the LaTeX is verbatim (no HTML
+      // attribute escaping of < or & in the inline `$…$` form).
+      expect(out).toBe('$a < b$');
       expect(out).not.toContain('&lt;');
+      expect(out).not.toContain('<span');
     });
 
-    it('block math carries LaTeX in a text attr WITHOUT escaping < or >', () => {
+    it('block math serializes as a $$ fence on its own lines', () => {
       const out = convertProseMirrorToMarkdown(
         doc({ type: 'mathBlock', attrs: { text: 'x > y & z' } }),
       );
-      // & IS escaped (entity-significant), but < and > are NOT.
-      expect(out).toBe(
-        '<div data-type="mathBlock" data-katex="true" text="x > y &amp; z"></div>',
-      );
-      expect(out).not.toContain('&lt;');
-      expect(out).not.toContain('&gt;');
+      // #293 canon #6: `$$\n<latex>\n$$`. The LaTeX is verbatim inside the fence
+      // (plain markdown, so & is NOT entity-escaped as it would be in an attr).
+      expect(out).toBe('$$\nx > y & z\n$$');
+      expect(out).not.toContain('&amp;');
+      expect(out).not.toContain('<div');
     });
   });
 
@@ -430,33 +429,31 @@ describe('convertProseMirrorToMarkdown', () => {
       );
     });
 
-    it('attachment emits div with schema data-attachment-* attrs', () => {
+    it('attachment emits link-form [name](url) + discriminator comment (#293 #8)', () => {
       const out = convertProseMirrorToMarkdown(
         doc({
           type: 'attachment',
           attrs: { url: '/files/x.zip', name: 'x.zip', mime: 'application/zip', size: 99 },
         }),
       );
+      // #293 canon #8: url is the markdown target, name is the visible link text,
+      // and every other attr rides in the ALWAYS-emitted `attachment` comment.
       expect(out).toBe(
-        '<div data-type="attachment" data-attachment-url="/files/x.zip" ' +
-          'data-attachment-name="x.zip" data-attachment-mime="application/zip" ' +
-          'data-attachment-size="99"></div>',
+        '[x.zip](/files/x.zip)<!--attachment {"mime":"application/zip","size":"99"}-->',
       );
     });
 
-    it('video emits a <div>-wrapped <video> with schema attrs', () => {
+    it('video emits image-form ![](src) + discriminator comment (#293 #8)', () => {
       const out = convertProseMirrorToMarkdown(
         doc({
           type: 'video',
           attrs: { src: '/v.mp4', alt: 'clip', width: 640 },
         }),
       );
-      expect(out).toBe(
-        '<div><video src="/v.mp4" aria-label="clip" width="640"></video></div>',
-      );
+      expect(out).toBe('![](/v.mp4)<!--video {"alt":"clip","width":"640"}-->');
     });
 
-    it('youtube emits a div[data-type="youtube"] with data-src', () => {
+    it('youtube emits image-form ![](src) + discriminator comment (#293 #8)', () => {
       const out = convertProseMirrorToMarkdown(
         doc({
           type: 'youtube',
@@ -464,8 +461,7 @@ describe('convertProseMirrorToMarkdown', () => {
         }),
       );
       expect(out).toBe(
-        '<div data-type="youtube" data-src="https://youtu.be/abc" ' +
-          'data-width="560" data-height="315"></div>',
+        '![](https://youtu.be/abc)<!--youtube {"width":"560","height":"315"}-->',
       );
     });
   });
diff --git a/packages/git-sync/test/markdown-document-envelope.test.ts b/packages/prosemirror-markdown/test/markdown-document-envelope.test.ts
similarity index 100%
rename from packages/git-sync/test/markdown-document-envelope.test.ts
rename to packages/prosemirror-markdown/test/markdown-document-envelope.test.ts
diff --git a/packages/git-sync/test/markdown-document.test.ts b/packages/prosemirror-markdown/test/markdown-document.test.ts
similarity index 100%
rename from packages/git-sync/test/markdown-document.test.ts
rename to packages/prosemirror-markdown/test/markdown-document.test.ts
diff --git a/packages/git-sync/test/markdown-roundtrip-spoiler-caption.test.ts b/packages/prosemirror-markdown/test/markdown-roundtrip-spoiler-caption.test.ts
similarity index 90%
rename from packages/git-sync/test/markdown-roundtrip-spoiler-caption.test.ts
rename to packages/prosemirror-markdown/test/markdown-roundtrip-spoiler-caption.test.ts
index ea6b4c00..8802c610 100644
--- a/packages/git-sync/test/markdown-roundtrip-spoiler-caption.test.ts
+++ b/packages/prosemirror-markdown/test/markdown-roundtrip-spoiler-caption.test.ts
@@ -8,8 +8,9 @@ import {
 // predated and must now preserve losslessly:
 //   - the `spoiler` inline mark (issue #259), emitted as raw inline HTML
 //     `<span data-spoiler="true">…</span>` (Markdown has no native syntax);
-//   - the image `caption` attribute (issue #221), emitted as `data-caption`
-//     on the raw <img> (Markdown `![](src)` cannot carry it).
+//   - the image `caption` attribute (issue #221). A top-level image now emits
+//     it in an attached `<!--img {…}-->` comment (#293 canon #4); a raw <img>
+//     with `data-caption` in incoming Markdown still parses it back too.
 // We exercise the real export -> import -> export cycle: a PM doc must survive
 // PM -> MD -> PM unchanged, and the raw-HTML forms in incoming Markdown must
 // parse back to the mark/attribute.
@@ -99,8 +100,9 @@ describe("image caption round-trip (#221)", () => {
     });
 
     const md1 = convertProseMirrorToMarkdown(source);
-    // A captioned image takes the raw <img> form so data-caption can ride along.
-    expect(md1).toContain('data-caption="A grey cat"');
+    // #293 canon #4: a top-level captioned image now serializes as the clean
+    // `![alt](src)` plus an attached `<!--img {…}-->` comment carrying caption.
+    expect(md1).toBe('![cat](/files/a.png) <!--img {"caption":"A grey cat"}-->');
 
     const doc2 = await markdownToProseMirror(md1);
     const img = findImage(doc2);
diff --git a/packages/git-sync/test/markdown-roundtrip.property.test.ts b/packages/prosemirror-markdown/test/markdown-roundtrip.property.test.ts
similarity index 100%
rename from packages/git-sync/test/markdown-roundtrip.property.test.ts
rename to packages/prosemirror-markdown/test/markdown-roundtrip.property.test.ts
diff --git a/packages/git-sync/test/markdown-to-prosemirror-gaps.test.ts b/packages/prosemirror-markdown/test/markdown-to-prosemirror-gaps.test.ts
similarity index 100%
rename from packages/git-sync/test/markdown-to-prosemirror-gaps.test.ts
rename to packages/prosemirror-markdown/test/markdown-to-prosemirror-gaps.test.ts
diff --git a/packages/prosemirror-markdown/test/math.test.ts b/packages/prosemirror-markdown/test/math.test.ts
new file mode 100644
index 00000000..27d71e63
--- /dev/null
+++ b/packages/prosemirror-markdown/test/math.test.ts
@@ -0,0 +1,262 @@
+import { describe, expect, it } from 'vitest';
+// Import DIRECTLY from src so we exercise the real converter pair (the parser
+// lives in markdown-to-prosemirror.ts; importing it mutates the global DOM via
+// jsdom at module load, which @tiptap/html's generateJSON needs under Node).
+import { convertProseMirrorToMarkdown } from '../src/lib/markdown-converter.js';
+import { markdownToProseMirror } from '../src/lib/markdown-to-prosemirror.js';
+
+// ---------------------------------------------------------------------------
+// #293 canon #6: math -> `$…$` (inline) and `$$…$$` (block).
+//
+// The CENTRAL correctness constraint is that a single/currency `$` is NEVER
+// math (`$5`, `it costs $5 and $10` stay literal), and a would-be-math `$x$`
+// span in PROSE round-trips as literal text (never a phantom math node). These
+// tests pin the serialize forms, the pandoc currency rule, the low-churn prose
+// escape, the columns/raw-HTML schema-HTML form, and codeBlock/inline-code
+// safety, and assert byte-stable round-trips throughout.
+// ---------------------------------------------------------------------------
+
+const doc = (...nodes: any[]) => ({ type: 'doc', content: nodes });
+const text = (t: string, marks?: any[]) =>
+  marks ? { type: 'text', text: t, marks } : { type: 'text', text: t };
+const para = (...inline: any[]) => ({ type: 'paragraph', content: inline });
+
+// export -> import -> export of `node` wrapped in a doc. Returns md1, the
+// re-imported doc2, and md2 (MUST equal md1 for a byte-stable git-sync path).
+async function roundTrip(node: any) {
+  const md1 = convertProseMirrorToMarkdown(doc(node));
+  const doc2 = await markdownToProseMirror(md1);
+  const md2 = convertProseMirrorToMarkdown(doc2);
+  return { md1, doc2, md2 };
+}
+
+// Depth-first search: the first node whose `type` matches, else undefined.
+function findNode(n: any, type: string): any {
+  if (!n || typeof n !== 'object') return undefined;
+  if (n.type === type) return n;
+  if (Array.isArray(n.content)) {
+    for (const c of n.content) {
+      const hit = findNode(c, type);
+      if (hit) return hit;
+    }
+  }
+  return undefined;
+}
+
+// Concatenate every text run under a node in content order ('' when none).
+function allText(n: any): string {
+  if (!n || typeof n !== 'object') return '';
+  if (n.type === 'text') return n.text || '';
+  if (Array.isArray(n.content)) return n.content.map(allText).join('');
+  return '';
+}
+
+describe('mathInline serialize + round-trip', () => {
+  it('mathInline x^2 -> exact $x^2$ and re-imports as mathInline attrs.text x^2', async () => {
+    const { md1, doc2, md2 } = await roundTrip(para({ type: 'mathInline', attrs: { text: 'x^2' } }));
+    expect(md1).toBe('$x^2$');
+    expect(md2).toBe(md1); // byte-stable
+    const math = findNode(doc2, 'mathInline');
+    expect(math).toBeDefined();
+    expect(math.attrs.text).toBe('x^2');
+    // No stray literal text, no math-shaped currency false positive.
+    expect(allText(doc2)).toBe('');
+  });
+
+  it('mathInline surrounded by prose round-trips as math (not currency)', async () => {
+    const { md1, doc2, md2 } = await roundTrip(
+      para(text('let '), { type: 'mathInline', attrs: { text: 'x^2' } }, text(' be')),
+    );
+    expect(md1).toBe('let $x^2$ be');
+    expect(md2).toBe(md1);
+    expect(findNode(doc2, 'mathInline').attrs.text).toBe('x^2');
+  });
+
+  it('LaTeX containing a literal $ is escaped \\$ and round-trips exact', async () => {
+    const { md1, doc2, md2 } = await roundTrip(para({ type: 'mathInline', attrs: { text: 'a$b' } }));
+    expect(md1).toBe('$a\\$b$'); // inner $ escaped so it cannot close early
+    expect(md2).toBe(md1);
+    expect(findNode(doc2, 'mathInline').attrs.text).toBe('a$b');
+  });
+
+  it('empty mathInline falls back to the lossless schema-HTML <span> form', async () => {
+    const { md1, doc2, md2 } = await roundTrip(para({ type: 'mathInline', attrs: { text: '' } }));
+    // An empty inline `$$` would read as a block-fence delimiter; the span form is lossless.
+    expect(md1).toBe('<span data-type="mathInline" data-katex="true" text=""></span>');
+    expect(md2).toBe(md1);
+    expect(findNode(doc2, 'mathInline')).toBeDefined();
+  });
+
+  it('mathInline whose LaTeX carries a pre-existing \\$ takes the span fallback', async () => {
+    // `\$` before escaping would make the `$`→`\$` escape ambiguous, so this
+    // rare case uses the always-lossless schema-HTML form (documented fork).
+    const { md1, doc2, md2 } = await roundTrip(para({ type: 'mathInline', attrs: { text: '\\$100' } }));
+    expect(md1).toContain('<span data-type="mathInline"');
+    expect(md1).not.toContain('$\\$100$');
+    expect(md2).toBe(md1);
+    expect(findNode(doc2, 'mathInline').attrs.text).toBe('\\$100');
+  });
+
+  it('mathInline immediately followed by a digit text run uses the span fallback (round-trips)', async () => {
+    // `$x^2$5` would fail the pandoc closing rule (digit after `$`), so the math
+    // node falls back to the lossless span form; the "5" stays literal text.
+    const { md1, doc2, md2 } = await roundTrip(
+      para({ type: 'mathInline', attrs: { text: 'x^2' } }, text('5')),
+    );
+    expect(md1).toBe('<span data-type="mathInline" data-katex="true" text="x^2"></span>5');
+    expect(md1).not.toContain('$x^2$5');
+    expect(md2).toBe(md1);
+    expect(findNode(doc2, 'mathInline').attrs.text).toBe('x^2');
+    expect(allText(doc2)).toBe('5');
+  });
+});
+
+describe('mathBlock serialize + round-trip', () => {
+  it('multi-line mathBlock -> $$ fence with LaTeX intact, byte-stable', async () => {
+    const latex = '\\int_0^1 f\n= 1';
+    const { md1, doc2, md2 } = await roundTrip({ type: 'mathBlock', attrs: { text: latex } });
+    expect(md1).toBe('$$\n\\int_0^1 f\n= 1\n$$');
+    expect(md2).toBe(md1);
+    const math = findNode(doc2, 'mathBlock');
+    expect(math).toBeDefined();
+    expect(math.attrs.text).toBe(latex); // multi-line preserved
+  });
+
+  it('single-line mathBlock round-trips', async () => {
+    const { md1, doc2, md2 } = await roundTrip({ type: 'mathBlock', attrs: { text: 'a^2+b^2' } });
+    expect(md1).toBe('$$\na^2+b^2\n$$');
+    expect(md2).toBe(md1);
+    expect(findNode(doc2, 'mathBlock').attrs.text).toBe('a^2+b^2');
+  });
+
+  it('empty mathBlock round-trips as an empty $$ fence', async () => {
+    const { md1, doc2, md2 } = await roundTrip({ type: 'mathBlock', attrs: { text: '' } });
+    expect(md1).toBe('$$\n\n$$');
+    expect(md2).toBe(md1);
+    expect(findNode(doc2, 'mathBlock')).toBeDefined();
+  });
+
+  it('mathBlock whose LaTeX contains a $$ takes the lossless <div> fallback', async () => {
+    const { md1, doc2, md2 } = await roundTrip({ type: 'mathBlock', attrs: { text: 'a $$ b' } });
+    expect(md1).toContain('<div data-type="mathBlock"');
+    expect(md1).not.toBe('$$\na $$ b\n$$');
+    expect(md2).toBe(md1);
+    expect(findNode(doc2, 'mathBlock').attrs.text).toBe('a $$ b');
+  });
+});
+
+describe('currency: a single/currency $ is NEVER math', () => {
+  const cases = ['it costs $5', '$5 and $10', 'a $5 b $6 c', 'price is $5', 'pay $5 now'];
+  for (const original of cases) {
+    it(`"${original}" stays literal text with NO backslashes and NO math node`, async () => {
+      const { md1, doc2, md2 } = await roundTrip(para(text(original)));
+      // Emitted markdown carries NO escaping (currency has no valid closing $).
+      expect(md1).toBe(original);
+      expect(md1).not.toContain('\\$');
+      expect(md2).toBe(md1);
+      // No math node materialized; the text is preserved EXACTLY.
+      expect(findNode(doc2, 'mathInline')).toBeUndefined();
+      expect(allText(doc2)).toBe(original);
+    });
+  }
+
+  it('a currency amount preserves the exact string across a round trip', async () => {
+    const { doc2 } = await roundTrip(para(text('$5 and $10')));
+    expect(allText(doc2)).toBe('$5 and $10');
+    expect(findNode(doc2, 'mathInline')).toBeUndefined();
+  });
+});
+
+describe('prose $x$ (would-be math) round-trips as literal text (escaped)', () => {
+  it('the set $A$ -> \\$A\\$ and re-imports as literal text, no math node', async () => {
+    const { md1, doc2, md2 } = await roundTrip(para(text('the set $A$ is closed')));
+    expect(md1).toBe('the set \\$A\\$ is closed');
+    expect(md2).toBe(md1); // byte-stable
+    expect(findNode(doc2, 'mathInline')).toBeUndefined();
+    // The literal text is preserved exactly (backslashes are a serialization
+    // detail, decoded back on import).
+    expect(allText(doc2)).toBe('the set $A$ is closed');
+  });
+});
+
+describe('math inside a column keeps the schema-HTML form (NOT $…$)', () => {
+  const oneColumn = (child: any) => ({
+    type: 'columns',
+    content: [{ type: 'column', content: [child] }],
+  });
+
+  it('mathBlock in a column emits <div> (no $$ fence), round-trips', async () => {
+    const { md1, doc2, md2 } = await roundTrip(
+      oneColumn({ type: 'mathBlock', attrs: { text: 'a^2+b^2' } }),
+    );
+    expect(md1).toContain('<div data-type="mathBlock" data-katex="true" text="a^2+b^2"></div>');
+    expect(md1).not.toContain('$$');
+    // The schema-HTML math form survives the round trip (a re-imported column
+    // gains a default data-layout, so we assert the math div, not full equality).
+    expect(md2).toContain('<div data-type="mathBlock" data-katex="true" text="a^2+b^2"></div>');
+    expect(md2).not.toContain('$$');
+    expect(findNode(doc2, 'mathBlock').attrs.text).toBe('a^2+b^2');
+  });
+
+  it('mathInline in a column paragraph emits <span> (no $…$), round-trips', async () => {
+    const { md1, doc2, md2 } = await roundTrip(
+      oneColumn(para(text('eq: '), { type: 'mathInline', attrs: { text: 'x_i' } })),
+    );
+    expect(md1).toContain('<span data-type="mathInline" data-katex="true" text="x_i"></span>');
+    expect(md1).not.toContain('$x_i$');
+    expect(md2).toContain('<span data-type="mathInline" data-katex="true" text="x_i"></span>');
+    expect(md2).not.toContain('$x_i$');
+    expect(findNode(doc2, 'mathInline').attrs.text).toBe('x_i');
+  });
+});
+
+describe('code is never math (canon #7 codeBlock regression class)', () => {
+  it('inline `code` span containing $x$ / $5 stays code, no math, no backslashes', async () => {
+    const { md1, doc2, md2 } = await roundTrip(
+      para(text('$x$ and $5', [{ type: 'code' }])),
+    );
+    // A code run is emitted verbatim in a backtick span — no `$` escaping, no math.
+    expect(md1).toBe('`$x$ and $5`');
+    expect(md1).not.toContain('\\$');
+    expect(md2).toBe(md1);
+    expect(findNode(doc2, 'mathInline')).toBeUndefined();
+    const codeRun = findNode(doc2, 'text');
+    expect(codeRun.marks?.some((m: any) => m.type === 'code')).toBe(true);
+    expect(codeRun.text).toBe('$x$ and $5');
+  });
+
+  it('codeBlock containing $…$ and $5 stays code, no math, no backslash corruption', async () => {
+    const code = 'cost = $5\nx = $y$';
+    const { md1, doc2, md2 } = await roundTrip({
+      type: 'codeBlock',
+      attrs: { language: 'python' },
+      content: [text(code)],
+    });
+    // Fenced code is literal: the `$` are verbatim, no escaping, no math node.
+    expect(md1).toContain('cost = $5');
+    expect(md1).toContain('x = $y$');
+    expect(md1).not.toContain('\\$');
+    expect(md2).toBe(md1);
+    expect(findNode(doc2, 'mathInline')).toBeUndefined();
+    expect(findNode(doc2, 'mathBlock')).toBeUndefined();
+    // The `$` are preserved verbatim inside the fence (marked re-adds one
+    // trailing newline the exporter strips again, so assert with toContain).
+    const codeText = allText(findNode(doc2, 'codeBlock'));
+    expect(codeText).toContain('cost = $5');
+    expect(codeText).toContain('x = $y$');
+    expect(codeText).not.toContain('\\$');
+  });
+});
+
+describe('fail-open: unbalanced / lone $ never crashes and stays literal', () => {
+  for (const src of ['$', '$$', 'a $ b', '$ x $', 'unbalanced $x here']) {
+    it(`"${src}" imports without crash and materializes no math node`, async () => {
+      const doc2 = await markdownToProseMirror(src);
+      expect(doc2).toBeDefined();
+      expect(findNode(doc2, 'mathInline')).toBeUndefined();
+      // A `$$` fence needs an opening AND a closing `$$` line (empty: `$$\n\n$$`);
+      // a lone `$$` line is not a valid fence, so no mathBlock either.
+      expect(findNode(doc2, 'mathBlock')).toBeUndefined();
+    });
+  }
+});
diff --git a/packages/prosemirror-markdown/test/media-comments.test.ts b/packages/prosemirror-markdown/test/media-comments.test.ts
new file mode 100644
index 00000000..35ccb783
--- /dev/null
+++ b/packages/prosemirror-markdown/test/media-comments.test.ts
@@ -0,0 +1,481 @@
+import { describe, expect, it } from 'vitest';
+import {
+  convertProseMirrorToMarkdown,
+  markdownToProseMirror,
+} from 'docmost-client';
+
+// ---------------------------------------------------------------------------
+// #293 canon #8 — media family -> md-form + discriminator comment.
+//
+// Ten node types move their TOP-LEVEL form from raw schema HTML to a readable
+// markdown target plus a discriminator `<!--name {…}-->` comment whose NAME
+// selects the node type:
+//
+//   IMAGE-FORM  `![](src)<!--name …-->`   youtube, video, audio, drawio, excalidraw
+//   LINK-FORM   `[text](src)<!--name …-->` pdf, attachment, embed
+//   STANDALONE  `<!--name …-->`            pageEmbed (pageembed), transclusionReference (transclusion)
+//
+// For EACH type this suite pins (1) a representative node -> exact md + a
+// byte-stable, lossless round-trip; (2) a MINIMAL node -> the discriminator is
+// STILL emitted and re-imports as the right TYPE (never an image/link); (3) the
+// same node INSIDE a column -> the schema-HTML form (no comment). Plus the
+// discriminator-integrity contract (a bare image / bare link with NO comment)
+// and fail-open behavior. The columns/raw-HTML form is the git-sync data path's
+// SAFETY net: a comment node is dropped inside a raw-HTML block, so these MUST
+// stay schema HTML there or the node vanishes.
+// ---------------------------------------------------------------------------
+
+function mkDoc(content: any[]) { return { type: 'doc', content }; } // wrap nodes in a doc root
+
+/** Export, re-import, export again; yields both markdown strings plus the re-parsed doc. */
+async function roundTrip(doc: any) {
+  const firstExport = convertProseMirrorToMarkdown(doc);
+  const reparsed = await markdownToProseMirror(firstExport);
+  const secondExport = convertProseMirrorToMarkdown(reparsed);
+  return { md1: firstExport, md2: secondExport, doc2: reparsed };
+}
+
+/** Depth-first, pre-order search: the first node whose `type` matches, else null. */
+const findFirst = (node: any, type: string): any => {
+  if (node?.type === type) return node;
+  for (const kid of node?.content || []) {
+    const match = findFirst(kid, type);
+    if (match !== null) return match;
+  }
+  return null;
+};
+
+/** Reports whether any node in the tree has a `link` entry in its `marks` array. */
+const hasLinkMark = (node: any): boolean => {
+  const ownMarks: any[] = Array.isArray(node?.marks) ? node.marks : [];
+  const isLink = (mark: any) => mark?.type === 'link';
+  return ownMarks.some(isLink) || (node?.content || []).some((kid: any) => hasLinkMark(kid));
+};
+
+/**
+ * Place `node` in the first column of a two-column layout (the raw-HTML
+ * container path); the second column holds a filler paragraph with text "x".
+ */
+const inColumn = (node: any) => {
+  const filler = { type: 'paragraph', content: [{ type: 'text', text: 'x' }] };
+  const columns = [node, filler].map((child) => ({
+    type: 'column',
+    content: [child],
+  }));
+  return mkDoc([{ type: 'columns', attrs: { layout: 'two_equal' }, content: columns }]);
+};
+
+// ---------------------------------------------------------------------------
+// Per-type: exact md, lossless byte-stable round-trip, minimal-node
+// discriminator, and the in-column schema-HTML form.
+// ---------------------------------------------------------------------------
+
+describe('#293 #8 IMAGE-FORM: youtube', () => {
+  it('representative node -> exact md + lossless byte-stable round-trip', async () => {
+    const attrs = { src: 'https://youtu.be/abc', width: 560, height: 315, align: 'right' };
+    const { md1, md2, doc2: reparsed } = await roundTrip(mkDoc([{ type: 'youtube', attrs }]));
+    // The src is the image target; the remaining attrs are expected in the
+    // comment JSON as strings (560 -> "560").
+    expect(md1).toBe(
+      '![](https://youtu.be/abc)<!--youtube {"width":"560","height":"315","align":"right"}-->',
+    );
+    expect(md2).toBe(md1);
+    const node = findFirst(reparsed, 'youtube');
+    expect(node).not.toBeNull();
+    expect(node.attrs.src).toBe('https://youtu.be/abc');
+    expect(node.attrs.width).toBe('560');
+    expect(node.attrs.height).toBe('315');
+    expect(node.attrs.align).toBe('right');
+  });
+
+  it('minimal node -> discriminator STILL emitted; round-trips to youtube (NOT image)', async () => {
+    const { md1, doc2: reparsed } = await roundTrip(mkDoc([{ type: 'youtube', attrs: { src: '/y' } }]));
+    expect(md1).toBe('![](/y)<!--youtube-->');
+    expect(findFirst(reparsed, 'youtube')).not.toBeNull();
+    expect(findFirst(reparsed, 'image')).toBeNull();
+  });
+
+  it('inside a column -> schema-HTML form (data-type="youtube", NO comment)', async () => {
+    const columnDoc = inColumn({ type: 'youtube', attrs: { src: '/y', width: 560 } });
+    const { md1, doc2: reparsed } = await roundTrip(columnDoc);
+    // Schema-HTML attributes must be present and the discriminator comment absent.
+    expect(md1).toContain('data-type="youtube"');
+    expect(md1).toContain('data-src="/y"');
+    expect(md1).not.toContain('<!--youtube');
+    expect(findFirst(reparsed, 'youtube')).not.toBeNull();
+  });
+});
+
+describe('#293 #8 IMAGE-FORM: video', () => {
+  it('representative node -> exact md + lossless byte-stable round-trip (attachmentId preserved)', async () => {
+    const doc = mkDoc([
+      {
+        type: 'video',
+        attrs: { src: '/v.mp4', alt: 'clip', attachmentId: 'ATT_V', width: 640, height: 480, size: 1234, aspectRatio: 1.777 },
+      },
+    ]);
+    const { md1, md2, doc2 } = await roundTrip(doc);
+    expect(md1).toBe(
+      '![](/v.mp4)<!--video {"alt":"clip","attachmentId":"ATT_V","width":"640","height":"480","size":"1234","aspectRatio":"1.777"}-->',
+    );
+    expect(md2).toBe(md1);
+    const v = findFirst(doc2, 'video');
+    expect(v).not.toBeNull(); // a missing node must fail as an assertion, not a TypeError
+    expect(v.attrs.src).toBe('/v.mp4');
+    expect(v.attrs.alt).toBe('clip');
+    expect(v.attrs.attachmentId).toBe('ATT_V'); // data-loss-critical id link survives
+    expect(v.attrs.aspectRatio).toBe('1.777');
+  });
+
+  it('minimal node -> discriminator STILL emitted; round-trips to video (NOT image)', async () => {
+    const { md1, doc2 } = await roundTrip(mkDoc([{ type: 'video', attrs: { src: '/v.mp4' } }]));
+    expect(md1).toBe('![](/v.mp4)<!--video-->');
+    expect(findFirst(doc2, 'video')).not.toBeNull();
+    expect(findFirst(doc2, 'image')).toBeNull();
+  });
+
+  it('inside a column -> schema-HTML <video> form (NO comment)', async () => {
+    const { md1, doc2 } = await roundTrip(
+      inColumn({ type: 'video', attrs: { src: '/v.mp4', attachmentId: 'ATT_V' } }),
+    );
+    expect(md1).toContain('<video ');
+    expect(md1).toContain('data-attachment-id="ATT_V"');
+    expect(md1).not.toContain('<!--video');
+    expect(findFirst(doc2, 'video')?.attrs.attachmentId).toBe('ATT_V'); // `?.`: absent node -> failed expect
+  });
+});
+
+describe('#293 #8 IMAGE-FORM: audio', () => {
+  it('representative node -> exact md + lossless byte-stable round-trip', async () => {
+    const attrs = { src: '/a.mp3', attachmentId: 'ATT_A', size: 9001 };
+    const { md1, md2, doc2 } = await roundTrip(mkDoc([{ type: 'audio', attrs }]));
+    expect(md1).toBe('![](/a.mp3)<!--audio {"attachmentId":"ATT_A","size":"9001"}-->');
+    expect(md2).toBe(md1);
+    const a = findFirst(doc2, 'audio');
+    expect(a).not.toBeNull(); // a missing node must fail as an assertion, not a TypeError
+    expect(a.attrs.src).toBe('/a.mp3');
+    expect(a.attrs.attachmentId).toBe('ATT_A');
+    expect(a.attrs.size).toBe('9001');
+  });
+
+  it('minimal node -> discriminator STILL emitted; round-trips to audio (NOT image)', async () => {
+    const { md1, doc2 } = await roundTrip(mkDoc([{ type: 'audio', attrs: { src: '/a.mp3' } }]));
+    expect(md1).toBe('![](/a.mp3)<!--audio-->');
+    expect(findFirst(doc2, 'audio')).not.toBeNull();
+    expect(findFirst(doc2, 'image')).toBeNull();
+  });
+
+  it('inside a column -> schema-HTML <audio> form (NO comment)', async () => {
+    const { md1, doc2 } = await roundTrip(inColumn({ type: 'audio', attrs: { src: '/a.mp3' } }));
+    expect(md1).toContain('<audio ');
+    expect(md1).not.toContain('<!--audio');
+    expect(findFirst(doc2, 'audio')).not.toBeNull();
+  });
+});
+
+describe('#293 #8 IMAGE-FORM: drawio / excalidraw (NAME discriminates the two)', () => {
+  for (const type of ['drawio', 'excalidraw'] as const) {
+    it(`${type}: representative node -> exact md + lossless byte-stable round-trip`, async () => {
+      const { md1, md2, doc2 } = await roundTrip(
+        mkDoc([{ type, attrs: { src: `/d.${type}`, title: 'T', width: 640, attachmentId: 'ATT_D' } }]),
+      );
+      expect(md1).toBe(`![](/d.${type})<!--${type} {"title":"T","width":"640","attachmentId":"ATT_D"}-->`);
+      expect(md2).toBe(md1);
+      const d = findFirst(doc2, type);
+      expect(d).not.toBeNull();
+      expect(d.attrs.src).toBe(`/d.${type}`);
+      expect(d.attrs.title).toBe('T');
+      expect(d.attrs.attachmentId).toBe('ATT_D');
+      // The OTHER diagram type must NOT appear (NAME is the discriminator).
+      expect(findFirst(doc2, type === 'drawio' ? 'excalidraw' : 'drawio')).toBeNull();
+    });
+
+    it(`${type}: minimal node -> discriminator STILL emitted; round-trips to ${type} (NOT image)`, async () => {
+      const { md1, doc2 } = await roundTrip(mkDoc([{ type, attrs: { src: `/d.${type}` } }]));
+      expect(md1).toBe(`![](/d.${type})<!--${type}-->`);
+      expect(findFirst(doc2, type)).not.toBeNull();
+      expect(findFirst(doc2, 'image')).toBeNull();
+    });
+
+    it(`${type}: inside a column -> schema-HTML data-type="${type}" form (NO comment)`, async () => {
+      const { md1, doc2 } = await roundTrip(
+        inColumn({ type, attrs: { src: `/d.${type}`, attachmentId: 'ATT_D' } }),
+      );
+      expect(md1).toContain(`data-type="${type}"`);
+      expect(md1).not.toContain(`<!--${type}`);
+      expect(findFirst(doc2, type)?.attrs.attachmentId).toBe('ATT_D'); // `?.`: absent node -> failed expect
+    });
+  }
+});
+
+describe('#293 #8 LINK-FORM: pdf', () => {
+  it('representative node -> exact md + lossless byte-stable round-trip', async () => {
+    const attrs = { src: '/d.pdf', name: 'd.pdf', attachmentId: 'ATT_P', size: 2048 };
+    const { md1, md2, doc2 } = await roundTrip(mkDoc([{ type: 'pdf', attrs }]));
+    expect(md1).toBe('[d.pdf](/d.pdf)<!--pdf {"attachmentId":"ATT_P","size":"2048"}-->');
+    expect(md2).toBe(md1);
+    const p = findFirst(doc2, 'pdf');
+    expect(p).not.toBeNull(); // a missing node must fail as an assertion, not a TypeError
+    expect(p.attrs.src).toBe('/d.pdf');
+    expect(p.attrs.name).toBe('d.pdf');
+    expect(p.attrs.attachmentId).toBe('ATT_P');
+    expect(p.attrs.size).toBe('2048');
+  });
+
+  it('minimal node -> discriminator STILL emitted; round-trips to pdf (NOT a plain link)', async () => {
+    const { md1, doc2 } = await roundTrip(mkDoc([{ type: 'pdf', attrs: { src: '/d.pdf', name: 'd.pdf' } }]));
+    expect(md1).toBe('[d.pdf](/d.pdf)<!--pdf-->');
+    expect(findFirst(doc2, 'pdf')).not.toBeNull();
+    expect(hasLinkMark(doc2)).toBe(false);
+  });
+
+  it('a filename with []\\ is escaped in the link text and round-trips losslessly', async () => {
+    const { md1, doc2 } = await roundTrip(mkDoc([{ type: 'pdf', attrs: { src: '/x', name: 'a]b[c.pdf' } }]));
+    expect(md1).toBe('[a\\]b\\[c.pdf](/x)<!--pdf-->');
+    expect(findFirst(doc2, 'pdf')?.attrs.name).toBe('a]b[c.pdf'); // `?.`: absent node -> failed expect
+  });
+
+  it('a filename with markdown-ACTIVE punctuation round-trips byte- AND value-stable', async () => {
+    // The link label is parsed as inline content, so emphasis/code/strike/
+    // autolink/entity/image markers would be consumed and lost via a.textContent
+    // if not escaped. Each of these names would corrupt without the full escape
+    // (e.g. `report *v2*.pdf` -> `report v2.pdf`). Assert both value AND byte
+    // stability (md2 === md1) so a real filename cannot silently churn a vault.
+    for (const name of [
+      'report *v2*.pdf',
+      'draft _final_.pdf',
+      'use `code`.pdf',
+      'a~~b~~.pdf',
+      'tag <x> & y.pdf',
+      'amp &amp; here.pdf',
+      '![shot](x).pdf',
+      // Canon inline-extension triggers (F5): math `$`, highlight `==`, footnote
+      // `^[` — a filename carrying these must not become a math/highlight/footnote
+      // node on import.
+      'data $A$.csv',
+      'q3 ==final==.pdf',
+      '5$ and 10$.pdf',
+      'note ^[x].pdf',
+    ]) {
+      const { md1, md2, doc2 } = await roundTrip(mkDoc([{ type: 'pdf', attrs: { src: '/x', name } }]));
+      expect(md2, name).toBe(md1); // byte-stable, no churn; message names the failing file
+      expect(findFirst(doc2, 'pdf')?.attrs.name, name).toBe(name); // exact value preserved
+    }
+  });
+
+  it('inside a column -> schema-HTML data-type="pdf" form (NO comment)', async () => {
+    const { md1, doc2 } = await roundTrip(
+      inColumn({ type: 'pdf', attrs: { src: '/d.pdf', name: 'd.pdf', attachmentId: 'ATT_P' } }),
+    );
+    expect(md1).toContain('data-type="pdf"');
+    expect(md1).toContain('data-name="d.pdf"');
+    expect(md1).not.toContain('<!--pdf');
+    expect(findFirst(doc2, 'pdf')?.attrs.attachmentId).toBe('ATT_P'); // `?.`: absent node -> failed expect
+  });
+});
+
+describe('#293 #8 LINK-FORM: attachment', () => {
+  it('representative node -> exact md + lossless byte-stable round-trip', async () => {
+    const attrs = { url: '/f.zip', name: 'f.zip', mime: 'application/zip', size: 512, attachmentId: 'ATT_Z' };
+    const { md1, md2, doc2 } = await roundTrip(mkDoc([{ type: 'attachment', attrs }]));
+    expect(md1).toBe(
+      '[f.zip](/f.zip)<!--attachment {"mime":"application/zip","size":"512","attachmentId":"ATT_Z"}-->',
+    );
+    expect(md2).toBe(md1);
+    const a = findFirst(doc2, 'attachment');
+    expect(a).not.toBeNull(); // a missing node must fail as an assertion, not a TypeError
+    expect(a.attrs.url).toBe('/f.zip');
+    expect(a.attrs.name).toBe('f.zip');
+    expect(a.attrs.mime).toBe('application/zip');
+    expect(a.attrs.attachmentId).toBe('ATT_Z');
+  });
+
+  it('minimal node (url only) -> empty text + discriminator; round-trips to attachment (NOT a link)', async () => {
+    const { md1, doc2 } = await roundTrip(mkDoc([{ type: 'attachment', attrs: { url: '/f.zip' } }]));
+    expect(md1).toBe('[](/f.zip)<!--attachment-->');
+    const a = findFirst(doc2, 'attachment');
+    expect(a).not.toBeNull();
+    expect(a.attrs.url).toBe('/f.zip');
+    expect(hasLinkMark(doc2)).toBe(false);
+  });
+
+  it('inside a column -> schema-HTML data-type="attachment" form (NO comment)', async () => {
+    const { md1, doc2 } = await roundTrip(
+      inColumn({ type: 'attachment', attrs: { url: '/f.zip', name: 'f.zip', attachmentId: 'ATT_Z' } }),
+    );
+    expect(md1).toContain('data-type="attachment"');
+    expect(md1).toContain('data-attachment-url="/f.zip"');
+    expect(md1).not.toContain('<!--attachment');
+    expect(findFirst(doc2, 'attachment')?.attrs.attachmentId).toBe('ATT_Z'); // `?.`: absent node -> failed expect
+  });
+});
+
+describe('#293 #8 LINK-FORM: embed', () => {
+  it('representative node -> exact md + lossless byte-stable round-trip', async () => {
+    const attrs = { src: 'https://x.com/e', provider: 'iframe', align: 'left', width: 600, height: 400 };
+    const { md1, md2, doc2 } = await roundTrip(mkDoc([{ type: 'embed', attrs }]));
+    expect(md1).toBe('[iframe](https://x.com/e)<!--embed {"align":"left","width":"600","height":"400"}-->');
+    expect(md2).toBe(md1);
+    const e = findFirst(doc2, 'embed');
+    expect(e).not.toBeNull(); // a missing node must fail as an assertion, not a TypeError
+    expect(e.attrs.src).toBe('https://x.com/e');
+    expect(e.attrs.provider).toBe('iframe');
+    expect(e.attrs.align).toBe('left');
+  });
+
+  it('minimal node -> discriminator STILL emitted; round-trips to embed (NOT a link)', async () => {
+    const { md1, doc2 } = await roundTrip(
+      mkDoc([{ type: 'embed', attrs: { src: 'https://x.com/e', provider: 'iframe' } }]),
+    );
+    expect(md1).toBe('[iframe](https://x.com/e)<!--embed-->');
+    const e = findFirst(doc2, 'embed');
+    expect(e).not.toBeNull();
+    expect(e.attrs.provider).toBe('iframe');
+    expect(hasLinkMark(doc2)).toBe(false);
+  });
+
+  it('inside a column -> schema-HTML data-type="embed" form (NO comment)', async () => {
+    const { md1, doc2 } = await roundTrip(
+      inColumn({ type: 'embed', attrs: { src: 'https://x.com/e', provider: 'iframe' } }),
+    );
+    expect(md1).toContain('data-type="embed"');
+    expect(md1).toContain('data-provider="iframe"');
+    expect(md1).not.toContain('<!--embed');
+    expect(findFirst(doc2, 'embed')?.attrs.provider).toBe('iframe'); // `?.`: absent node -> failed expect
+  });
+});
+
+describe('#293 #8 STANDALONE: pageEmbed', () => {
+  it('representative node -> exact md + lossless byte-stable round-trip (sourcePageId preserved)', async () => {
+    const { md1, md2, doc2 } = await roundTrip(
+      mkDoc([{ type: 'pageEmbed', attrs: { sourcePageId: 'PAGE_X' } }]),
+    );
+    expect(md1).toBe('<!--pageembed {"sourcePageId":"PAGE_X"}-->'); // comment name is lowercase
+    expect(md2).toBe(md1);
+    const pe = findFirst(doc2, 'pageEmbed');
+    expect(pe).not.toBeNull();
+    expect(pe.attrs.sourcePageId).toBe('PAGE_X');
+  });
+
+  it('minimal node -> name-only discriminator; round-trips to pageEmbed', async () => {
+    const { md1, doc2 } = await roundTrip(mkDoc([{ type: 'pageEmbed', attrs: {} }]));
+    expect(md1).toBe('<!--pageembed-->');
+    expect(findFirst(doc2, 'pageEmbed')).not.toBeNull();
+  });
+
+  it('inside a column -> schema-HTML data-type="pageEmbed" form (NO comment)', async () => {
+    const { md1, doc2 } = await roundTrip(
+      inColumn({ type: 'pageEmbed', attrs: { sourcePageId: 'PAGE_X' } }),
+    );
+    expect(md1).toContain('data-type="pageEmbed"');
+    expect(md1).toContain('data-source-page-id="PAGE_X"');
+    expect(md1).not.toContain('<!--pageembed');
+    expect(findFirst(doc2, 'pageEmbed')?.attrs.sourcePageId).toBe('PAGE_X'); // `?.`: absent node -> failed expect
+  });
+});
+
+describe('#293 #8 STANDALONE: transclusionReference', () => {
+  it('representative node -> exact md + lossless byte-stable round-trip (both id links preserved)', async () => {
+    const { md1, md2, doc2 } = await roundTrip(
+      mkDoc([{ type: 'transclusionReference', attrs: { sourcePageId: 'PAGE_X', transclusionId: 'TR_Y' } }]),
+    );
+    expect(md1).toBe('<!--transclusion {"sourcePageId":"PAGE_X","transclusionId":"TR_Y"}-->');
+    expect(md2).toBe(md1);
+    const tr = findFirst(doc2, 'transclusionReference');
+    expect(tr).not.toBeNull();
+    expect(tr.attrs.sourcePageId).toBe('PAGE_X');
+    expect(tr.attrs.transclusionId).toBe('TR_Y');
+  });
+
+  it('minimal node -> name-only discriminator; round-trips to transclusionReference', async () => {
+    const { md1, doc2 } = await roundTrip(mkDoc([{ type: 'transclusionReference', attrs: {} }]));
+    expect(md1).toBe('<!--transclusion-->');
+    expect(findFirst(doc2, 'transclusionReference')).not.toBeNull();
+  });
+
+  it('inside a column -> schema-HTML data-type="transclusionReference" form (NO comment)', async () => {
+    const { md1, doc2 } = await roundTrip(
+      inColumn({ type: 'transclusionReference', attrs: { sourcePageId: 'PAGE_X', transclusionId: 'TR_Y' } }),
+    );
+    expect(md1).toContain('data-type="transclusionReference"');
+    expect(md1).toContain('data-transclusion-id="TR_Y"');
+    expect(md1).not.toContain('<!--transclusion');
+    expect(findFirst(doc2, 'transclusionReference')?.attrs.transclusionId).toBe('TR_Y'); // `?.`: absent node -> failed expect
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Discriminator integrity: the NAME is the ONLY type selector. A bare markdown
+// target with NO following comment is NEVER sniffed into a media type.
+// ---------------------------------------------------------------------------
+
+describe('#293 #8 discriminator integrity (no comment -> never a media type)', () => {
+  it('a bare ![](url) with NO comment is an IMAGE, never youtube/video/etc.', async () => {
+    const parsed = await markdownToProseMirror('![](https://youtu.be/abc)');
+    expect(findFirst(parsed, 'image')).not.toBeNull();
+    // None of the image-form media types may appear without a discriminator.
+    const imageFormTypes = ['youtube', 'video', 'audio', 'drawio', 'excalidraw'];
+    imageFormTypes.forEach((mediaType) => expect(findFirst(parsed, mediaType)).toBeNull());
+  });
+
+  it('a bare [text](src) with NO comment is a plain link, never pdf/attachment/embed', async () => {
+    const parsed = await markdownToProseMirror('[report.pdf](/files/report.pdf)');
+    // The link MARK survives; NO media node materializes.
+    expect(hasLinkMark(parsed)).toBe(true);
+    // None of the link-form media types may appear without a discriminator.
+    const linkFormTypes = ['pdf', 'attachment', 'embed'];
+    linkFormTypes.forEach((mediaType) => expect(findFirst(parsed, mediaType)).toBeNull());
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Fail-open: malformed/misplaced discriminators never crash and never corrupt.
+// ---------------------------------------------------------------------------
+
+describe('#293 #8 fail-open', () => {
+  it('malformed JSON after an image-form target does not throw; stays an image', async () => {
+    const parsed = await markdownToProseMirror('![](u.png)<!--youtube {bad-->');
+    // parseAttachedComment returns null for the broken JSON, so the comment is
+    // inert: the img stays a plain image and nothing throws.
+    expect(findFirst(parsed, 'image')).not.toBeNull();
+    expect(findFirst(parsed, 'youtube')).toBeNull();
+    // Byte-stable on the way back out (no phantom growth).
+    const exported = convertProseMirrorToMarkdown(parsed);
+    const reExported = convertProseMirrorToMarkdown(await markdownToProseMirror(exported));
+    expect(reExported).toBe(exported);
+  });
+
+  it('malformed JSON after a link-form target does not throw; stays a plain link', async () => {
+    const parsed = await markdownToProseMirror('[f](/x)<!--attachment {bad}-->');
+    expect(findFirst(parsed, 'attachment')).toBeNull();
+    expect(hasLinkMark(parsed)).toBe(true);
+  });
+
+  it('a malformed standalone discriminator does not throw and materializes no atom', async () => {
+    const parsed = await markdownToProseMirror('<!--pageembed {oops-->');
+    expect(findFirst(parsed, 'pageEmbed')).toBeNull();
+    expect(findFirst(parsed, 'transclusionReference')).toBeNull();
+  });
+
+  it('an unknown key in a valid comment is ignored (fail-open); the node still materializes', async () => {
+    const parsed = await markdownToProseMirror('![](/y)<!--youtube {"unknownKey":1,"width":"560"}-->');
+    const node = findFirst(parsed, 'youtube');
+    expect(node).not.toBeNull();
+    expect(node.attrs.width).toBe('560');
+    expect(node.attrs).not.toHaveProperty('unknownKey');
+  });
+
+  it('an image-form discriminator with NO adjacent <img> is inert', async () => {
+    // In `text <!--youtube-->` the comment sits inside a <p> beside text rather
+    // than an <img>: wrong element -> inert, no youtube node, no crash.
+    const parsed = await markdownToProseMirror('some text <!--youtube-->');
+    expect(findFirst(parsed, 'youtube')).toBeNull();
+    expect(findFirst(parsed, 'paragraph')).not.toBeNull();
+  });
+
+  it('a standalone media discriminator in ATTACHED position (next to text) is inert', async () => {
+    const parsed = await markdownToProseMirror('inline text <!--pageembed {"sourcePageId":"p1"}-->');
+    expect(findFirst(parsed, 'pageEmbed')).toBeNull();
+    expect(findFirst(parsed, 'paragraph')).not.toBeNull();
+  });
+});
diff --git a/packages/git-sync/test/media-roundtrip.test.ts b/packages/prosemirror-markdown/test/media-roundtrip.test.ts
similarity index 73%
rename from packages/git-sync/test/media-roundtrip.test.ts
rename to packages/prosemirror-markdown/test/media-roundtrip.test.ts
index cc687704..9cde5541 100644
--- a/packages/git-sync/test/media-roundtrip.test.ts
+++ b/packages/prosemirror-markdown/test/media-roundtrip.test.ts
@@ -52,9 +52,9 @@ describe('media atom round-trip (audio/video/pdf/attachment/embed/youtube)', ()
     ]);
     const { md1, md2, doc2 } = await roundTrip(doc);
 
-    expect(md1).toBe(
-      '<div><audio src="/a.mp3" data-attachment-id="att-7" data-size="9001"></audio></div>',
-    );
+    // #293 canon #8 image-form: `![](src)` + the ALWAYS-emitted `audio`
+    // discriminator carrying the other attrs as JSON (numerics stringified).
+    expect(md1).toBe('![](/a.mp3)<!--audio {"attachmentId":"att-7","size":"9001"}-->');
     // Byte-stable: a second export reproduces the first exactly.
     expect(md2).toBe(md1);
 
@@ -87,8 +87,10 @@ describe('media atom round-trip (audio/video/pdf/attachment/embed/youtube)', ()
     ]);
     const { md1, md2, doc2 } = await roundTrip(doc);
 
+    // #293 canon #8 image-form: align="center" (the schema default) is OMITTED,
+    // so the whole optional set except align rides in the `video` comment JSON.
     expect(md1).toBe(
-      '<div><video src="/v.mp4" aria-label="clip" data-attachment-id="att-1" width="640" height="480" data-size="1234" data-align="center" data-aspect-ratio="1.777"></video></div>',
+      '![](/v.mp4)<!--video {"alt":"clip","attachmentId":"att-1","width":"640","height":"480","size":"1234","aspectRatio":"1.777"}-->',
     );
     expect(md2).toBe(md1);
 
@@ -108,19 +110,26 @@ describe('media atom round-trip (audio/video/pdf/attachment/embed/youtube)', ()
   });
 
   // 3. minimal video (only src) --------------------------------------------
-  it('minimal video (src only): NOT byte-stable (gains data-align="center") but canonically equal', async () => {
+  it('minimal video (src only): the discriminator is STILL emitted; byte-stable; round-trips to VIDEO not image', async () => {
     const doc = mkDoc([{ type: 'video', attrs: { src: '/v.mp4' } }]);
     const { md1, md2, doc2 } = await roundTrip(doc);
 
-    expect(md1).toBe('<div><video src="/v.mp4"></video></div>');
-    // video.align has a non-null schema default 'center' that materializes on
-    // import; the converter only emits data-align when set, so export #2 grows
-    // by data-align="center" exactly once (the documented one-time asymmetry).
-    expect(md2).toBe('<div><video src="/v.mp4" data-align="center"></video></div>');
-    expect(md2).not.toBe(md1);
+    // #293 canon #8: the comment is the type discriminator, so it is emitted even
+    // with no extra attrs (name-only). Without it a bare `![](src)` would be read
+    // as an `image`. align="center" default is omitted, so the form is byte-stable
+    // (unlike the old div-form, which gained data-align="center" on import).
+    expect(md1).toBe('![](/v.mp4)<!--video-->');
+    expect(md2).toBe(md1);
 
-    // align:'center' is normalized away via KNOWN_DEFAULTS.video, so despite the
-    // byte growth the documents ARE canonically equal.
+    // Critically: it round-trips to a VIDEO node, NOT an image.
+    const video = findFirst(doc2, 'video');
+    expect(video).not.toBeNull();
+    expect(video.type).toBe('video');
+    expect(findFirst(doc2, 'image')).toBeNull();
+    expect(video.attrs.src).toBe('/v.mp4');
+
+    // align:'center' is normalized away via KNOWN_DEFAULTS.video, so the
+    // documents ARE canonically equal.
     expect(docsCanonicallyEqual(doc, doc2)).toBe(true);
   });
 
@@ -131,9 +140,9 @@ describe('media atom round-trip (audio/video/pdf/attachment/embed/youtube)', ()
     ]);
     const { md1, md2, doc2 } = await roundTrip(doc);
 
-    expect(md1).toBe(
-      '<div data-type="pdf" src="/d.pdf" data-name="d.pdf" data-attachment-id="att-9"></div>',
-    );
+    // #293 canon #8 link-form: `[name](src)` + the `pdf` discriminator; the id
+    // link (attachmentId) is data-loss-critical and rides in the comment JSON.
+    expect(md1).toBe('[d.pdf](/d.pdf)<!--pdf {"attachmentId":"att-9"}-->');
     expect(md2).toBe(md1);
 
     const pdf = findFirst(doc2, 'pdf');
@@ -163,8 +172,10 @@ describe('media atom round-trip (audio/video/pdf/attachment/embed/youtube)', ()
     ]);
     const { md1, md2, doc2 } = await roundTrip(doc);
 
+    // #293 canon #8 link-form: url is the target, name the visible text, and
+    // mime/size/attachmentId ride in the `attachment` discriminator comment.
     expect(md1).toBe(
-      '<div data-type="attachment" data-attachment-url="/f.zip" data-attachment-name="f.zip" data-attachment-mime="application/zip" data-attachment-size="512" data-attachment-id="att-3"></div>',
+      '[f.zip](/f.zip)<!--attachment {"mime":"application/zip","size":"512","attachmentId":"att-3"}-->',
     );
     expect(md2).toBe(md1);
 
@@ -197,8 +208,10 @@ describe('media atom round-trip (audio/video/pdf/attachment/embed/youtube)', ()
     ]);
     const { md1, md2, doc2 } = await roundTrip(doc);
 
+    // #293 canon #8 link-form: provider is the visible text; the non-default
+    // align/width/height (defaults center/800/600) ride in the comment JSON.
     expect(md1).toBe(
-      '<div data-type="embed" data-src="https://x.com/e" data-provider="iframe" data-align="left" data-width="600" data-height="400"></div>',
+      '[iframe](https://x.com/e)<!--embed {"align":"left","width":"600","height":"400"}-->',
     );
     expect(md2).toBe(md1);
 
@@ -213,29 +226,27 @@ describe('media atom round-trip (audio/video/pdf/attachment/embed/youtube)', ()
   });
 
   // 7. minimal embed (only src+provider) -----------------------------------
-  it('minimal embed (src+provider): NOT byte-stable; defaults width/height materialize as NUMBERS 800/600', async () => {
+  it('minimal embed (src+provider): discriminator still emitted; byte-stable; defaults materialize as NUMBERS 800/600', async () => {
     const doc = mkDoc([
       { type: 'embed', attrs: { src: 'https://x.com/e', provider: 'iframe' } },
     ]);
     const { md1, md2, doc2 } = await roundTrip(doc);
 
-    expect(md1).toBe(
-      '<div data-type="embed" data-src="https://x.com/e" data-provider="iframe"></div>',
-    );
-    // embed has non-null schema defaults align='center', width=800, height=600
-    // that the converter never emits on export #1 but materialize on import, so
-    // export #2 grows by three data-* attrs (a one-time divergence).
-    expect(md2).toBe(
-      '<div data-type="embed" data-src="https://x.com/e" data-provider="iframe" data-align="center" data-width="800" data-height="600"></div>',
-    );
-    expect(md2).not.toBe(md1);
+    // #293 canon #8: align/width/height are all at their schema defaults
+    // (center/800/600), so the discriminator is name-only. Unlike the old
+    // div-form (which grew three data-* attrs on import), the md-form OMITS the
+    // defaults on BOTH exports, so it is byte-stable from export #1.
+    expect(md1).toBe('[iframe](https://x.com/e)<!--embed-->');
+    expect(md2).toBe(md1);
 
     const embed = findFirst(doc2, 'embed');
     expect(embed).not.toBeNull();
+    expect(embed.type).toBe('embed');
+    // Round-trips to EMBED, not a plain link.
+    expect(embed.attrs.provider).toBe('iframe');
     expect(embed.attrs.align).toBe('center');
-    // NOTE: these come from the addAttributes default (NOT parseHTML), so on the
-    // FIRST import they are the NUMBERS 800/600, not strings — parseHTML only
-    // runs when the attribute is actually present on the imported element.
+    // NOTE: these come from the addAttributes default (NOT parseHTML), so they
+    // are the NUMBERS 800/600 — parseHTML only runs when the attribute is present.
     expect(embed.attrs.width).toBe(800);
     expect(embed.attrs.height).toBe(600);
   });
@@ -255,8 +266,10 @@ describe('media atom round-trip (audio/video/pdf/attachment/embed/youtube)', ()
     ]);
     const { md1, md2, doc2 } = await roundTrip(doc);
 
+    // #293 canon #8 image-form: width/height/align(right) ride in the `youtube`
+    // discriminator comment (align "right" is non-default so it is kept).
     expect(md1).toBe(
-      '<div data-type="youtube" data-src="https://youtu.be/abc" data-width="560" data-height="315" data-align="right"></div>',
+      '![](https://youtu.be/abc)<!--youtube {"width":"560","height":"315","align":"right"}-->',
     );
     expect(md2).toBe(md1);
 
diff --git a/packages/git-sync/test/node-ops-extra.test.ts b/packages/prosemirror-markdown/test/node-ops-extra.test.ts
similarity index 100%
rename from packages/git-sync/test/node-ops-extra.test.ts
rename to packages/prosemirror-markdown/test/node-ops-extra.test.ts
diff --git a/packages/git-sync/test/node-ops.test.ts b/packages/prosemirror-markdown/test/node-ops.test.ts
similarity index 100%
rename from packages/git-sync/test/node-ops.test.ts
rename to packages/prosemirror-markdown/test/node-ops.test.ts
diff --git a/packages/git-sync/test/page-file.test.ts b/packages/prosemirror-markdown/test/page-file.test.ts
similarity index 100%
rename from packages/git-sync/test/page-file.test.ts
rename to packages/prosemirror-markdown/test/page-file.test.ts
diff --git a/packages/git-sync/test/redteam-converter.test.ts b/packages/prosemirror-markdown/test/redteam-converter.test.ts
similarity index 100%
rename from packages/git-sync/test/redteam-converter.test.ts
rename to packages/prosemirror-markdown/test/redteam-converter.test.ts
diff --git a/packages/prosemirror-markdown/test/resolved-comment-anchors.test.ts b/packages/prosemirror-markdown/test/resolved-comment-anchors.test.ts
new file mode 100644
index 00000000..2b83f223
--- /dev/null
+++ b/packages/prosemirror-markdown/test/resolved-comment-anchors.test.ts
@@ -0,0 +1,95 @@
+import { describe, expect, it } from 'vitest';
+// Import the converter DIRECTLY from src (NOT the docmost-client barrel, which
+// pulls in collaboration.ts and mutates the global DOM at import time), matching
+// the other converter unit tests (see markdown-converter-html-marks.test.ts).
+import { convertProseMirrorToMarkdown } from '../src/lib/markdown-converter.js';
+
+// gitmost #328 Channel 1: the `dropResolvedCommentAnchors` converter option
+// hides RESOLVED comment anchors from agent reads while keeping ACTIVE anchors.
+// The option defaults to false (zero behavior change for the lossless git-sync
+// export path). Two emitters read it: the top-level marks loop and the raw-HTML
+// inlineToHtml path (inside columns / spanned table cells).
+
+const text = (t: string, marks?: any[]) =>
+  marks ? { type: 'text', text: t, marks } : { type: 'text', text: t };
+const para = (...inline: any[]) => ({ type: 'paragraph', content: inline });
+const doc = (...nodes: any[]) => ({ type: 'doc', content: nodes });
+
+const commentMark = (commentId: string, resolved: boolean) => ({
+  type: 'comment',
+  attrs: { commentId, resolved },
+});
+
+// A columns node (raw-HTML container) so its children render via the
+// blockToHtml -> inlineToHtml path (the SECOND `case "comment"` emitter).
+const oneColumn = (...blocks: any[]) => ({
+  type: 'columns',
+  attrs: { layout: 'two' },
+  content: [{ type: 'column', content: blocks }],
+});
+
+describe('#328 Channel 1 — top-level emitter: dropResolvedCommentAnchors', () => {
+  const resolvedDoc = doc(
+    para(text('kept '), text('resolved', [commentMark('r1', true)])),
+  );
+  const activeDoc = doc(
+    para(text('kept '), text('active', [commentMark('a1', false)])),
+  );
+
+  it('drops a RESOLVED anchor (bare text) WITH the flag', () => {
+    const out = convertProseMirrorToMarkdown(resolvedDoc, {
+      dropResolvedCommentAnchors: true,
+    });
+    expect(out).toBe('kept resolved');
+    expect(out).not.toContain('data-comment-id');
+  });
+
+  it('PRESERVES a RESOLVED anchor WITHOUT the flag (default off)', () => {
+    const out = convertProseMirrorToMarkdown(resolvedDoc);
+    expect(out).toContain(
+      '<span data-comment-id="r1" data-resolved="true">resolved</span>',
+    );
+  });
+
+  it('KEEPS an ACTIVE anchor in BOTH cases', () => {
+    const withFlag = convertProseMirrorToMarkdown(activeDoc, {
+      dropResolvedCommentAnchors: true,
+    });
+    const withoutFlag = convertProseMirrorToMarkdown(activeDoc);
+    expect(withFlag).toContain('<span data-comment-id="a1">active</span>');
+    expect(withoutFlag).toContain('<span data-comment-id="a1">active</span>');
+  });
+});
+
+describe('#328 Channel 1 — raw-HTML inlineToHtml emitter (columns)', () => {
+  const resolvedCol = doc(
+    oneColumn(para(text('resolved', [commentMark('r1', true)]))),
+  );
+  const activeCol = doc(
+    oneColumn(para(text('active', [commentMark('a1', false)]))),
+  );
+
+  it('drops a RESOLVED anchor (bare text) WITH the flag', () => {
+    const out = convertProseMirrorToMarkdown(resolvedCol, {
+      dropResolvedCommentAnchors: true,
+    });
+    expect(out).toContain('<p>resolved</p>');
+    expect(out).not.toContain('data-comment-id');
+  });
+
+  it('PRESERVES a RESOLVED anchor WITHOUT the flag', () => {
+    const out = convertProseMirrorToMarkdown(resolvedCol);
+    expect(out).toContain(
+      '<span data-comment-id="r1" data-resolved="true">resolved</span>',
+    );
+  });
+
+  it('KEEPS an ACTIVE anchor in BOTH cases', () => {
+    const withFlag = convertProseMirrorToMarkdown(activeCol, {
+      dropResolvedCommentAnchors: true,
+    });
+    const withoutFlag = convertProseMirrorToMarkdown(activeCol);
+    expect(withFlag).toContain('<span data-comment-id="a1">active</span>');
+    expect(withoutFlag).toContain('<span data-comment-id="a1">active</span>');
+  });
+});
diff --git a/packages/git-sync/test/roundtrip-all-nodes.test.ts b/packages/prosemirror-markdown/test/roundtrip-all-nodes.test.ts
similarity index 100%
rename from packages/git-sync/test/roundtrip-all-nodes.test.ts
rename to packages/prosemirror-markdown/test/roundtrip-all-nodes.test.ts
diff --git a/packages/prosemirror-markdown/test/roundtrip-corpus.test.ts b/packages/prosemirror-markdown/test/roundtrip-corpus.test.ts
new file mode 100644
index 00000000..05814d4a
--- /dev/null
+++ b/packages/prosemirror-markdown/test/roundtrip-corpus.test.ts
@@ -0,0 +1,68 @@
+import { readFile } from 'node:fs/promises';
+import { readdirSync } from 'node:fs';
+import { fileURLToPath } from 'node:url';
+import { dirname, join } from 'node:path';
+import { describe, expect, it } from 'vitest';
+import {
+  convertProseMirrorToMarkdown,
+  markdownToProseMirror,
+  docsCanonicallyEqual,
+} from 'docmost-client';
+
+// Resolve fixtures relative to this test file so the test is CWD-independent.
+const here = dirname(fileURLToPath(import.meta.url));
+const CORPUS_DIR = join(here, 'fixtures', 'corpus');
+
+/** Run a single document through export -> import -> export. */
+async function roundTrip(doc: any) {
+  const md1 = convertProseMirrorToMarkdown(doc);
+  const doc2 = await markdownToProseMirror(md1);
+  const md2 = convertProseMirrorToMarkdown(doc2);
+  return { md1, md2, doc2 };
+}
+
+describe('round-trip corpus (SPEC §11)', () => {
+  // Discover the corpus synchronously at collection time so each fixture gets
+  // its own `it` with the file name in the test title.
+  const files = readdirSync(CORPUS_DIR)
+    .filter((name) => name.endsWith('.json'))
+    .sort();
+
+  it('has a non-empty corpus', () => {
+    expect(files.length).toBeGreaterThan(0);
+  });
+
+  for (const name of files) {
+    it(`${name}: markdown byte-stable AND canonically stable`, async () => {
+      const doc = JSON.parse(await readFile(join(CORPUS_DIR, name), 'utf8'));
+      const { md1, md2, doc2 } = await roundTrip(doc);
+
+      // 1) The byte-stable markdown property git actually needs.
+      expect(md2, `${name}: markdown not byte-stable`).toBe(md1);
+      // 2) Semantic stability (block ids stripped, default-null normalized).
+      expect(
+        docsCanonicallyEqual(doc, doc2),
+        `${name}: document not canonically stable`,
+      ).toBe(true);
+    });
+  }
+});
+
+// ---------------------------------------------------------------------------
+// FORMER KNOWN LIMITATION — now promoted into the green corpus above.
+//
+// SPEC §11 flagged images and diagrams as high round-trip risk, and
+// `image-diagrams.json` (a paragraph + block image + drawio + excalidraw) was
+// held out here with `it.fails` because export #2 did not reproduce export #1:
+// the drawio/excalidraw `align` default "center" materialized on import, so
+// export #2 grew a `data-align="center"` suffix.
+//
+// #293 canon #8 removes that divergence. The diagram family now serializes at
+// TOP LEVEL as `![](src)<!--drawio|excalidraw {…}-->`, and — exactly like the
+// image `![](src)` form — a default `align:"center"` is OMITTED from the comment
+// JSON (it re-materializes as the schema default on import, then is omitted again
+// on re-export). The block-image hoist that once left a phantom empty paragraph
+// is already absorbed by `stripEmptyParagraphs`. The fixture is therefore now
+// BOTH byte-stable AND canonically stable, so it lives in fixtures/corpus as
+// `11-image-diagrams.json` and is exercised by the green corpus loop above.
+// ---------------------------------------------------------------------------
diff --git a/packages/prosemirror-markdown/test/roundtrip-helpers.ts b/packages/prosemirror-markdown/test/roundtrip-helpers.ts
new file mode 100644
index 00000000..20eb490f
--- /dev/null
+++ b/packages/prosemirror-markdown/test/roundtrip-helpers.ts
@@ -0,0 +1,75 @@
+/**
+ * Pure, IO-free comparison helpers for the idempotency round-trip checks. The
+ * round-trip harness that drives these lives in the package's tests, not in the
+ * engine.
+ */
+
+/**
+ * Recursively strip every `attrs.id` from a ProseMirror node tree. Block ids
+ * are regenerated by `markdownToProseMirror` (SPEC §11), so they must be
+ * ignored when comparing the semantic shape of two documents. Returns a NEW
+ * tree; the input is not mutated.
+ */
+export function stripBlockIds(node: any): any {
+  // Primitives (null/undefined included) pass through; arrays are rebuilt per element.
+  if (!node || typeof node !== "object") return node;
+  if (Array.isArray(node)) return node.map((child) => stripBlockIds(child));
+
+  const copy: any = {};
+  Object.keys(node).forEach((field) => {
+    const value = node[field];
+    const isAttrBag = field === "attrs" && value && typeof value === "object";
+    if (!isAttrBag) {
+      copy[field] = stripBlockIds(value);
+      return;
+    }
+    // Peel `id` off the attribute bag; every other attribute survives.
+    const { id: _dropped, ...kept } = value as Record<string, unknown>;
+    void _dropped;
+    copy.attrs = stripBlockIds(kept);
+  });
+  return copy;
+}
+
+/**
+ * Find the first divergence between two values via a recursive deep compare.
+ * Returns a short path + the two differing values, or null if they are equal.
+ */
+export function firstDivergence(
+  a: any,
+  b: any,
+  path = "$",
+): { path: string; a: any; b: any } | null {
+  // Identical primitives, or the very same reference: nothing to report.
+  if (a === b) return null;
+
+  // Anything that is not a pair of non-null objects differs right here.
+  const bothObjects =
+    typeof a === "object" && typeof b === "object" && a !== null && b !== null;
+  // An array is never equal to a plain object, whatever either contains.
+  if (!bothObjects || Array.isArray(a) !== Array.isArray(b)) {
+    return { path, a, b };
+  }
+
+  if (Array.isArray(a)) {
+    // Report a length mismatch before descending into the elements.
+    if (a.length !== b.length) {
+      return { path: `${path}.length`, a: a.length, b: b.length };
+    }
+    let index = 0;
+    for (const left of a) {
+      const hit = firstDivergence(left, b[index], `${path}[${index}]`);
+      if (hit !== null) return hit;
+      index += 1;
+    }
+    return null;
+  }
+
+  // Walk the union of keys: `a`'s own keys first, then any only `b` has.
+  const names = new Set(Object.keys(a).concat(Object.keys(b)));
+  for (const name of names) {
+    const hit = firstDivergence(a[name], b[name], `${path}.${name}`);
+    if (hit !== null) return hit;
+  }
+  return null;
+}
diff --git a/packages/git-sync/test/roundtrip.test.ts b/packages/prosemirror-markdown/test/roundtrip.test.ts
similarity index 96%
rename from packages/git-sync/test/roundtrip.test.ts
rename to packages/prosemirror-markdown/test/roundtrip.test.ts
index 62db34b3..3132f904 100644
--- a/packages/git-sync/test/roundtrip.test.ts
+++ b/packages/prosemirror-markdown/test/roundtrip.test.ts
@@ -60,10 +60,8 @@ describe('math round-trip (mathBlock + mathInline)', () => {
     const source = { type: 'mathBlock', attrs: { text: 'a^2+b^2' } };
     const { md1, doc2, md2 } = await roundTrip(source);
 
-    // One-way emit: LaTeX rides in the `text` HTML attribute, data-katex flag set.
-    expect(md1).toBe(
-      '<div data-type="mathBlock" data-katex="true" text="a^2+b^2"></div>',
-    );
+    // #293 canon #6: block math emits a `$$` fence on its own lines.
+    expect(md1).toBe('$$\na^2+b^2\n$$');
     // Byte-stable: the second export reproduces the first exactly.
     expect(md2).toBe(md1);
 
@@ -81,9 +79,8 @@ describe('math round-trip (mathBlock + mathInline)', () => {
     const source = para({ type: 'mathInline', attrs: { text: 'x_i' } });
     const { md1, doc2, md2 } = await roundTrip(source);
 
-    expect(md1).toBe(
-      '<span data-type="mathInline" data-katex="true" text="x_i"></span>',
-    );
+    // #293 canon #6: inline math emits the Obsidian-native `$LaTeX$` form.
+    expect(md1).toBe('$x_i$');
     expect(md2).toBe(md1);
 
     // The re-imported paragraph's child is a mathInline with the LaTeX recovered.
diff --git a/packages/git-sync/test/schema-editor-ext-contract.test.ts b/packages/prosemirror-markdown/test/schema-editor-ext-contract.test.ts
similarity index 100%
rename from packages/git-sync/test/schema-editor-ext-contract.test.ts
rename to packages/prosemirror-markdown/test/schema-editor-ext-contract.test.ts
diff --git a/packages/git-sync/test/schema-surface-snapshot.test.ts b/packages/prosemirror-markdown/test/schema-surface-snapshot.test.ts
similarity index 100%
rename from packages/git-sync/test/schema-surface-snapshot.test.ts
rename to packages/prosemirror-markdown/test/schema-surface-snapshot.test.ts
diff --git a/packages/prosemirror-markdown/test/serializer-contract.test.ts b/packages/prosemirror-markdown/test/serializer-contract.test.ts
new file mode 100644
index 00000000..4ec993d7
--- /dev/null
+++ b/packages/prosemirror-markdown/test/serializer-contract.test.ts
@@ -0,0 +1,194 @@
+import { readFileSync } from "node:fs";
+import { fileURLToPath } from "node:url";
+
+import { describe, expect, it } from "vitest";
+import { getSchema } from "@tiptap/core";
+
+import { docmostExtensions } from "../src/lib/docmost-schema.js";
+import { convertProseMirrorToMarkdown } from "../src/lib/markdown-converter.js";
+import { markdownToProseMirror } from "../src/lib/markdown-to-prosemirror.js";
+
+/**
+ * SERIALIZER-CONTRACT GUARD (#293 canon #inventory, bug 3).
+ *
+ * The markdown serializer (`convertProseMirrorToMarkdown`) dispatches on
+ * `node.type` in a big `switch`. Any node type that reaches the `default` arm
+ * is NOT serialized as itself — it silently collapses to its children's text
+ * (or, for an ATOM node with no children, to the empty string). The canon
+ * inventory flagged exactly this class: had the editor schema declared inline
+ * atoms like `emoji`/`date`/`toc`, a document could carry one and the converter
+ * would drop it with no case and no error (a git-sync data-loss on the data
+ * path).
+ *
+ * INVARIANT: every node type declared in the package schema
+ * (`docmostExtensions`) has an EXPLICIT serializer case. This test derives the
+ * node-type set from the live schema and asserts a `case "<name>":` exists in
+ * the serializer source for each. A future node added to the schema WITHOUT a
+ * serializer case (the emoji/date/toc failure mode) fails here loudly.
+ *
+ * We scan the SOURCE (not behavioral output) because it is the only formulation
+ * that reliably catches a missing case for EVERY node kind: a missing case on a
+ * *container* node still emits its children via `default` (non-empty output, so
+ * a behavioral non-empty check would pass while structure was lost), whereas the
+ * source scan catches the drop regardless of whether the node is an atom or a
+ * container. A complementary behavioral check for the atom case follows.
+ */
+
+const SERIALIZER_SOURCE = readFileSync(
+  fileURLToPath(new URL("../src/lib/markdown-converter.ts", import.meta.url)),
+  "utf8",
+);
+
+function schemaNodeNames(): string[] {
+  const schema = getSchema(docmostExtensions as never);
+  return Object.keys(schema.nodes).sort();
+}
+
+describe("serializer contract: every schema node type has a serializer case", () => {
+  const nodeNames = schemaNodeNames();
+
+  it("covers a known, non-trivial set of node types", () => {
+    // Sanity: the schema really does expose the full Docmost node surface, so
+    // this test is not vacuously iterating an empty/tiny list.
+    expect(nodeNames.length).toBeGreaterThanOrEqual(40);
+    // A representative atom that would silently drop without a case.
+    expect(nodeNames).toContain("status");
+    expect(nodeNames).toContain("mention");
+  });
+
+  for (const name of nodeNames) {
+    it(`serializer has an explicit case for node type "${name}"`, () => {
+      // Node names and mark names never collide, so a `case "<node>"` anywhere
+      // in the serializer is that node's case (marks have distinct names).
+      const pattern = new RegExp(`case "${name}"\\s*:`);
+      expect(
+        pattern.test(SERIALIZER_SOURCE),
+        `Node type "${name}" is declared in the package schema but has no ` +
+          `case "${name}": in convertProseMirrorToMarkdown — it would fall ` +
+          `through to the default arm and be silently dropped on git-sync ` +
+          `export. Add a lossless serializer case (see mention/status).`,
+      ).toBe(true);
+    });
+  }
+});
+
+/**
+ * Behavioral complement: an INLINE ATOM with no serializer case collapses to
+ * "" via the default arm (exactly the emoji/date/toc risk). Prove that the two
+ * inline atoms the schema actually declares (mention, status) do NOT vanish —
+ * i.e. the default-drop path is not reached for them. This is the runtime shape
+ * the source-scan invariant protects.
+ */
+describe("serializer contract: inline atoms are not dropped to empty", () => {
+  const P = (...c: any[]) => ({ type: "paragraph", content: c });
+  const doc = (...c: any[]) => ({ type: "doc", content: c });
+
+  it("mention serializes to non-empty output", () => {
+    const md = convertProseMirrorToMarkdown(
+      doc(P({ type: "mention", attrs: { id: "u1", label: "Bob" } })),
+    );
+    expect(md.trim()).not.toBe("");
+    expect(md).toContain('data-type="mention"');
+  });
+
+  it("status serializes to non-empty output", () => {
+    const md = convertProseMirrorToMarkdown(
+      doc(P({ type: "status", attrs: { text: "Done", color: "green" } })),
+    );
+    expect(md.trim()).not.toBe("");
+    expect(md).toContain('data-type="status"');
+  });
+});
+
+/**
+ * Raw-HTML path (columns) round-trips for the two marks fixed alongside the
+ * contract test. A column renders its inline content via `inlineToHtml`, whose
+ * mark switch previously lacked a `spoiler` case (bug 1) and dropped a link's
+ * `title` (bug 2).
+ */
+
+// Walk a ProseMirror tree and return the first text run whose marks include the
+// given mark type, or undefined.
+function findMarkedText(n: any, markType: string): any {
+  // Primitives and null can neither be a text run nor hold children.
+  if (n === null || typeof n !== "object") return undefined;
+
+  // A missing or non-array `marks` list counts as "no marks".
+  const marks: any[] = Array.isArray(n.marks) ? n.marks : [];
+  const carriesMark = marks.some((mark: any) => mark?.type === markType);
+  if (n.type === "text" && carriesMark) return n;
+
+  // Depth-first, document order: the first matching descendant wins.
+  const children: any[] = Array.isArray(n.content) ? n.content : [];
+  for (const child of children) {
+    const found = findMarkedText(child, markType);
+    if (found) return found;
+  }
+  return undefined;
+}
+
+describe("raw-HTML path (columns): spoiler + link title round-trip", () => {
+  const P = (...c: any[]) => ({ type: "paragraph", content: c });
+  const doc = (...c: any[]) => ({ type: "doc", content: c });
+  const column = (...c: any[]) => ({
+    type: "column",
+    attrs: { width: "50%" },
+    content: c,
+  });
+
+  it("bug 1: a spoiler mark inside a column survives the round trip", async () => {
+    const original = doc({
+      type: "columns",
+      content: [
+        column(P({ type: "text", text: "hidden", marks: [{ type: "spoiler" }] })),
+        column(P({ type: "text", text: "plain" })),
+      ],
+    });
+    const md = convertProseMirrorToMarkdown(original);
+    // The raw-HTML path must emit the schema's spoiler span (RED before bug 1
+    // fix: inlineToHtml had no spoiler case, so the mark was dropped and the
+    // text emitted bare).
+    expect(md).toContain('data-spoiler="true"');
+    expect(md).toContain("<span data-spoiler=\"true\">hidden</span>");
+
+    const back = await markdownToProseMirror(md);
+    const spoilered = findMarkedText(back, "spoiler");
+    expect(spoilered).toBeDefined();
+    expect(spoilered.text).toBe("hidden");
+  });
+
+  it("bug 2: a link with a title inside a column keeps its title", async () => {
+    const original = doc({
+      type: "columns",
+      content: [
+        column(
+          P({
+            type: "text",
+            text: "site",
+            marks: [
+              {
+                type: "link",
+                attrs: { href: "https://example.com", title: "Example Title" },
+              },
+            ],
+          }),
+        ),
+        column(P({ type: "text", text: "plain" })),
+      ],
+    });
+    const md = convertProseMirrorToMarkdown(original);
+    // The raw-HTML anchor must carry the title (RED before bug 2 fix:
+    // inlineToHtml emitted <a href> with no title).
+    expect(md).toContain('title="Example Title"');
+    expect(md).toContain('href="https://example.com"');
+
+    const back = await markdownToProseMirror(md);
+    const linked = findMarkedText(back, "link");
+    expect(linked).toBeDefined();
+    const linkMark = linked.marks.find((m: any) => m.type === "link");
+    expect(linkMark.attrs?.href).toBe("https://example.com");
+    // The schema's link mark carries `title`; it must round-trip through the
+    // raw-HTML column path.
+    expect(linkMark.attrs?.title).toBe("Example Title");
+  });
+});
diff --git a/packages/prosemirror-markdown/test/textalign.test.ts b/packages/prosemirror-markdown/test/textalign.test.ts
new file mode 100644
index 00000000..7c8dcb89
--- /dev/null
+++ b/packages/prosemirror-markdown/test/textalign.test.ts
@@ -0,0 +1,160 @@
+import { describe, expect, it } from 'vitest';
+// Import DIRECTLY from src (NOT the docmost-client barrel, which pulls in
+// collaboration.ts and mutates global DOM at import time).
+import { convertProseMirrorToMarkdown } from '../src/lib/markdown-converter.js';
+import { markdownToProseMirror } from '../src/lib/markdown-to-prosemirror.js';
+import {
+  attachedCommentFor,
+  parseAttachedComment,
+} from '../src/lib/attached-comment.js';
+
+// #293 canon decision #9: paragraph/heading `textAlign` serializes as an
+// ATTACHED HTML comment at the END of the block line —
+//   `some text <!--attrs {"textAlign":"center"}-->`
+// — replacing the old `<div align>` / `<p style="text-align:…">` wrappers, which
+// did NOT round-trip cleanly (alignment was lost on the first stabilize pass).
+// These tests are non-vacuous: they assert the EXACT emitted markdown (so they
+// fail against any wrapper form) AND that the alignment survives a full
+// PM -> MD -> PM round trip (which the old `<div align>` never did).
+
+const doc = (...nodes: any[]) => ({ type: 'doc', content: nodes });
+const text = (t: string) => ({ type: 'text', text: t });
+const para = (align: string | null, ...inline: any[]) => ({
+  type: 'paragraph',
+  attrs: align === null ? {} : { textAlign: align },
+  content: inline,
+});
+const heading = (level: number, align: string | null, ...inline: any[]) => ({
+  type: 'heading',
+  attrs: align === null ? { level } : { level, textAlign: align },
+  content: inline,
+});
+
+// Find the first paragraph/heading node in a generated doc (skips the doc root).
+const firstBlock = (d: any) => d.content?.[0];
+
+describe('attached-comment primitives (reusable for #9/#4/#8)', () => {
+  it('attachedCommentFor emits a compact `<!--name {json}-->`', () => {
+    expect(attachedCommentFor('attrs', { textAlign: 'center' })).toBe(
+      '<!--attrs {"textAlign":"center"}-->',
+    );
+  });
+
+  it('attachedCommentFor escapes a `--` pair so it cannot close the comment early', () => {
+    // A string value containing `--` would otherwise inject `-->`. Each hyphen of
+    // the pair is emitted as the JSON unicode escape `\u002d`; JSON.parse restores
+    // the original hyphens on the reading side.
+    const s = attachedCommentFor('img', { alt: 'a--b' });
+    expect(s).toBe('<!--img {"alt":"a\\u002d\\u002db"}-->');
+    // No premature `--` inside the payload (between the `<!--` opener and the
+    // `-->` closer), so the comment cannot terminate early.
+    expect(s.slice(4, -3)).not.toContain('--');
+    // Round-trip through the parser primitive restores the exact value.
+    const inner = s.slice('<!--'.length, -'-->'.length);
+    expect(parseAttachedComment(inner)).toEqual({ name: 'img', attrs: { alt: 'a--b' } });
+  });
+
+  it('parseAttachedComment fails open on malformed JSON and non-objects', () => {
+    expect(parseAttachedComment('attrs {not json}')).toBeNull();
+    expect(parseAttachedComment('attrs [1,2]')).toBeNull();
+    expect(parseAttachedComment('   ')).toBeNull();
+    // Name-only comment is a valid marker with empty attrs.
+    expect(parseAttachedComment('attrs')).toEqual({ name: 'attrs', attrs: {} });
+  });
+});
+
+describe('paragraph.textAlign serialization (#293 #9)', () => {
+  for (const align of ['center', 'right', 'justify']) {
+    it(`paragraph textAlign "${align}" -> trailing <!--attrs--> comment`, () => {
+      expect(convertProseMirrorToMarkdown(doc(para(align, text('hello'))))).toBe(
+        `hello <!--attrs {"textAlign":"${align}"}-->`,
+      );
+    });
+  }
+
+  it('default textAlign (null) emits NO comment', () => {
+    expect(convertProseMirrorToMarkdown(doc(para(null, text('hello'))))).toBe('hello');
+  });
+
+  it('"left" (visual default) emits NO comment', () => {
+    expect(convertProseMirrorToMarkdown(doc(para('left', text('hello'))))).toBe('hello');
+  });
+});
+
+describe('heading.textAlign serialization (#293 #9)', () => {
+  it('heading keeps "## text" and attaches the alignment comment', () => {
+    expect(convertProseMirrorToMarkdown(doc(heading(2, 'center', text('Title'))))).toBe(
+      '## Title <!--attrs {"textAlign":"center"}-->',
+    );
+  });
+
+  it('default heading emits the bare "## text" form', () => {
+    expect(convertProseMirrorToMarkdown(doc(heading(3, null, text('Plain'))))).toBe('### Plain');
+  });
+});
+
+describe('paragraph.textAlign round-trip PM -> MD -> PM (#293 #9)', () => {
+  for (const align of ['center', 'right', 'justify']) {
+    it(`preserves paragraph textAlign "${align}"`, async () => {
+      const md1 = convertProseMirrorToMarkdown(doc(para(align, text('hello'))));
+      expect(md1).toBe(`hello <!--attrs {"textAlign":"${align}"}-->`);
+      const doc2 = await markdownToProseMirror(md1);
+      const block = firstBlock(doc2);
+      expect(block.type).toBe('paragraph');
+      expect(block.attrs.textAlign).toBe(align);
+      // Text is intact (the trailing space before the comment is trimmed).
+      expect(block.content?.[0]?.text).toBe('hello');
+      // Byte-stable second export closes the loop.
+      expect(convertProseMirrorToMarkdown(doc2)).toBe(md1);
+    });
+  }
+
+  it('default paragraph re-imports with textAlign null (no comment survives)', async () => {
+    const md1 = convertProseMirrorToMarkdown(doc(para(null, text('hello'))));
+    const doc2 = await markdownToProseMirror(md1);
+    const block = firstBlock(doc2);
+    expect(block.type).toBe('paragraph');
+    expect(block.attrs.textAlign ?? null).toBeNull();
+  });
+});
+
+describe('heading.textAlign round-trip PM -> MD -> PM (#293 #9)', () => {
+  for (const [level, align] of [
+    [2, 'center'],
+    [3, 'right'],
+    [1, 'justify'],
+  ] as [number, string][]) {
+    it(`preserves h${level} textAlign "${align}"`, async () => {
+      const md1 = convertProseMirrorToMarkdown(doc(heading(level, align, text('Head'))));
+      expect(md1).toBe(`${'#'.repeat(level)} Head <!--attrs {"textAlign":"${align}"}-->`);
+      const doc2 = await markdownToProseMirror(md1);
+      const block = firstBlock(doc2);
+      expect(block.type).toBe('heading');
+      expect(block.attrs.level).toBe(level);
+      expect(block.attrs.textAlign).toBe(align);
+      expect(convertProseMirrorToMarkdown(doc2)).toBe(md1);
+    });
+  }
+});
+
+describe('attached-comment fail-open in the import pipeline (#293 #9)', () => {
+  it('a malformed attrs comment is ignored (default attrs kept)', async () => {
+    const doc2 = await markdownToProseMirror('hello <!--attrs {bad json}-->');
+    const block = firstBlock(doc2);
+    expect(block.type).toBe('paragraph');
+    expect(block.attrs.textAlign ?? null).toBeNull();
+    expect(block.content?.[0]?.text).toBe('hello');
+  });
+
+  it('an unknown key in a valid attrs comment is ignored, no comment leaks', async () => {
+    const doc2 = await markdownToProseMirror('hello <!--attrs {"bogus":"x"}-->');
+    const block = firstBlock(doc2);
+    expect(block.type).toBe('paragraph');
+    expect(block.attrs.textAlign ?? null).toBeNull();
+    // The unknown key and the comment marker must not survive into the body.
+    expect(block.content?.[0]?.text).toBe('hello');
+    const serialized = JSON.stringify(doc2);
+    expect(serialized).not.toContain('bogus');
+    expect(serialized).not.toContain('<!--');
+  });
+});
diff --git a/packages/prosemirror-markdown/tsconfig.json b/packages/prosemirror-markdown/tsconfig.json
new file mode 100644
index 00000000..c58cbd9d
--- /dev/null
+++ b/packages/prosemirror-markdown/tsconfig.json
@@ -0,0 +1,15 @@
+{
+  "compilerOptions": {
+    "target": "ES2022",
+    "module": "Node16",
+    "moduleResolution": "Node16",
+    "outDir": "./build",
+    "rootDir": "./src",
+    "strict": true,
+    "esModuleInterop": true,
+    "skipLibCheck": true,
+    "forceConsistentCasingInFileNames": true,
+    "declaration": true
+  },
+  "include": ["src/**/*"]
+}
diff --git a/packages/prosemirror-markdown/vitest.config.ts b/packages/prosemirror-markdown/vitest.config.ts
new file mode 100644
index 00000000..33d0fbe4
--- /dev/null
+++ b/packages/prosemirror-markdown/vitest.config.ts
@@ -0,0 +1,23 @@
+import { fileURLToPath } from 'node:url';
+import path from 'node:path';
+import { defineConfig } from 'vitest/config';
+
+// Ported docmost-sync tests import the converter through the upstream package
+// barrel specifier `docmost-client`. We vendored only the PURE half of that
+// package into `src/lib`, so alias the barrel specifier to our local lib
+// barrel; everything those tests use (converter, canonicalize, markdown
+// envelope, markdownToProseMirror) is re-exported there.
+const here = path.dirname(fileURLToPath(import.meta.url));
+const libBarrel = path.resolve(here, 'src/lib/index.ts');
+
+export default defineConfig({
+  resolve: {
+    alias: {
+      'docmost-client': libBarrel,
+    },
+  },
+  test: {
+    environment: 'node',
+    include: ['test/**/*.test.ts'],
+  },
+});
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index 7836f325..299f5e51 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -902,6 +902,9 @@ importers:
 
   packages/git-sync:
     dependencies:
+      '@docmost/prosemirror-markdown':
+        specifier: workspace:*
+        version: link:../prosemirror-markdown
       '@tiptap/core':
         specifier: 3.20.4
         version: 3.20.4(@tiptap/pm@3.20.4)
@@ -966,6 +969,9 @@ importers:
 
   packages/mcp:
     dependencies:
+      '@docmost/prosemirror-markdown':
+        specifier: workspace:*
+        version: link:../prosemirror-markdown
       '@fellow/prosemirror-recreate-transform':
         specifier: ^1.2.3
         version: 1.2.3
@@ -1049,6 +1055,67 @@ importers:
         specifier: ^5.0.0
         version: 5.9.3
 
+  packages/prosemirror-markdown:
+    dependencies:
+      '@tiptap/core':
+        specifier: 3.20.4
+        version: 3.20.4(@tiptap/pm@3.20.4)
+      '@tiptap/extension-highlight':
+        specifier: 3.20.4
+        version: 3.20.4(@tiptap/core@3.20.4(@tiptap/pm@3.20.4))
+      '@tiptap/extension-image':
+        specifier: 3.20.4
+        version: 3.20.4(@tiptap/core@3.20.4(@tiptap/pm@3.20.4))
+      '@tiptap/extension-subscript':
+        specifier: 3.20.4
+        version: 3.20.4(@tiptap/core@3.20.4(@tiptap/pm@3.20.4))(@tiptap/pm@3.20.4)
+      '@tiptap/extension-superscript':
+        specifier: 3.20.4
+        version: 3.20.4(@tiptap/core@3.20.4(@tiptap/pm@3.20.4))(@tiptap/pm@3.20.4)
+      '@tiptap/extension-task-item':
+        specifier: 3.20.4
+        version: 3.20.4(@tiptap/extension-list@3.20.4(@tiptap/core@3.20.4(@tiptap/pm@3.20.4))(@tiptap/pm@3.20.4))
+      '@tiptap/extension-task-list':
+        specifier: 3.20.4
+        version: 3.20.4(@tiptap/extension-list@3.20.4(@tiptap/core@3.20.4(@tiptap/pm@3.20.4))(@tiptap/pm@3.20.4))
+      '@tiptap/html':
+        specifier: 3.20.4
+        version: 3.20.4(@tiptap/core@3.20.4(@tiptap/pm@3.20.4))(@tiptap/pm@3.20.4)(happy-dom@20.8.9)
+      '@tiptap/pm':
+        specifier: 3.20.4
+        version: 3.20.4
+      '@tiptap/starter-kit':
+        specifier: 3.20.4
+        version: 3.20.4
+      jsdom:
+        specifier: 25.0.0
+        version: 25.0.0
+      marked:
+        specifier: 17.0.5
+        version: 17.0.5
+      zod:
+        specifier: 4.3.6
+        version: 4.3.6
+    devDependencies:
+      '@docmost/editor-ext':
+        specifier: workspace:*
+        version: link:../editor-ext
+      '@types/jsdom':
+        specifier: ^21.1.7
+        version: 21.1.7
+      '@types/node':
+        specifier: ^20.0.0
+        version: 20.19.43
+      fast-check:
+        specifier: ^4.8.0
+        version: 4.8.0
+      typescript:
+        specifier: ^5.0.0
+        version: 5.9.3
+      vitest:
+        specifier: 4.1.6
+        version: 4.1.6(@opentelemetry/api@1.9.0)(@types/node@20.19.43)(@vitest/coverage-v8@4.1.6)(happy-dom@20.8.9)(jsdom@25.0.0)(vite@8.0.5(@types/node@20.19.43)(esbuild@0.28.0)(jiti@2.4.2)(less@4.2.0)(sugarss@5.0.1(postcss@8.5.14))(terser@5.39.0)(tsx@4.21.0)(yaml@2.8.3))
+
 packages:
 
   '@aashutoshrathi/word-wrap@1.2.6':
@@ -11619,7 +11686,7 @@ snapshots:
 
   '@babel/code-frame@7.29.0':
     dependencies:
-      '@babel/helper-validator-identifier': 7.28.5
+      '@babel/helper-validator-identifier': 7.29.7
       js-tokens: 4.0.0
       picocolors: 1.1.1
 
@@ -16086,7 +16153,7 @@ snapshots:
       obug: 2.1.1
       std-env: 4.1.0
       tinyrainbow: 3.1.0
-      vitest: 4.1.6(@opentelemetry/api@1.9.0)(@types/node@22.19.1)(@vitest/coverage-v8@4.1.6)(happy-dom@20.8.9)(jsdom@25.0.0)(vite@8.0.5(@types/node@22.19.1)(esbuild@0.28.0)(jiti@2.4.2)(less@4.2.0)(sugarss@5.0.1(postcss@8.5.14))(terser@5.39.0)(tsx@4.21.0)(yaml@2.8.3))
+      vitest: 4.1.6(@opentelemetry/api@1.9.0)(@types/node@25.5.0)(@vitest/coverage-v8@4.1.6)(happy-dom@20.8.9)(jsdom@27.4.0(@noble/hashes@2.0.1))(vite@8.0.5(@types/node@25.5.0)(esbuild@0.28.0)(jiti@2.4.2)(less@4.2.0)(sugarss@5.0.1(postcss@8.5.14))(terser@5.39.0)(tsx@4.21.0)(yaml@2.8.3))
 
   '@vitest/expect@4.1.6':
     dependencies: