test: add full test suite for docmost-client and remaining modules

Raise coverage from 2.6% to 68% statements by adding 19 test files (~480 tests) covering every module in test-strategy-report.md. No production code changed — tests reach private logic via (client as any), mock HTTP with axios-mock-adapter on the real axios instance (interceptors intact), and mock the Hocuspocus provider with vi.mock + real yjs + fake timers. Coverage: auth-utils/filters/page-lock/json-edit 100%, diff 99%, node-ops 96%, transforms 95%, collaboration 86%, layout 91%, client.ts 41% (transport). - node-ops/transforms/json-edit/page-lock/filters: pure tree/text ops, immutability + clone guarantees, throw-vs-noop contracts - markdown-converter + markdown-document envelope + fast-check round-trip property test - diff, docmost-schema (sanitizeCssColor/clampCalloutType security guards) - collaboration: pure (buildCollabWsUrl/buildYDoc) + write-path (mutatePageContent read-transform-write, false-success suppression) - client.ts: isSafeUrl/validateDoc* XSS guards, vm-sandbox, REST pagination, 401 re-auth interceptor, login dedup, uploadImage/createPage multipart guards - collectRecentSince edge cases; loadSettingsOrExit invalid-value branch - env-gated E2E skeleton (DOCMOST_E2E) Two genuine markdown round-trip non-idempotency bugs are documented as it.fails (code-mark excludes other marks; block-image injects a blank line). Latent: isSafeUrl allows file:// on link context. Adds dev-deps: fast-check, @vitest/coverage-v8, axios-mock-adapter; adds the "coverage" npm script.
2026-06-16 22:50:04 +03:00
parent cc13c94f53
commit 90d8f86fda
14 changed files with 5306 additions and 2 deletions
--- a/package-lock.json
+++ b/package-lock.json
--- a/package.json
+++ b/package.json
@@ -5,14 +5,19 @@
  "type": "module",
  "description": "Bidirectional sync daemon between Docmost articles and a local Markdown git vault (git is the state store). See SPEC.md.",
  "license": "MIT",
-  "workspaces": ["packages/*"],
-  "engines": { "node": ">=20" },
+  "workspaces": [
+    "packages/*"
+  ],
+  "engines": {
+    "node": ">=20"
+  },
  "scripts": {
    "build": "npm run build -w docmost-client && tsc",
    "start": "node build/index.js",
    "dev": "tsx watch src/index.ts",
    "test": "vitest run",
    "test:watch": "vitest",
+    "coverage": "vitest run --coverage --coverage.provider=v8 --coverage.include='src/**/*.ts' --coverage.include='packages/docmost-client/src/**/*.ts'",
    "roundtrip": "node build/roundtrip.js",
    "pull": "node build/pull.js"
  },
@@ -23,6 +28,9 @@
  },
  "devDependencies": {
    "@types/node": "22.19.21",
+    "@vitest/coverage-v8": "^3.2.6",
+    "axios-mock-adapter": "^2.1.0",
+    "fast-check": "^4.8.0",
    "tsx": "4.22.4",
    "typescript": "5.9.3",
    "vitest": "3.2.6"
--- a/test/auth-utils.test.ts
+++ b/test/auth-utils.test.ts
@@ -0,0 +1,275 @@
+import { afterEach, beforeEach, describe, expect, it, vi } from 'vitest';
+import axios from 'axios';
+import MockAdapter from 'axios-mock-adapter';
+import {
+  getCollabToken,
+  performLogin,
+} from '../packages/docmost-client/src/lib/auth-utils.js';
+
+// Both the source module and this test import the default axios instance,
+// which is hoisted to the workspace-root node_modules. MockAdapter installed
+// on that shared instance therefore intercepts the bare axios.post calls made
+// inside auth-utils.ts, and axios.isAxiosError still recognises the synthetic
+// errors MockAdapter throws.
+const BASE_URL = 'https://docmost.example.com/api';
+const API_TOKEN = 'test-api-token';
+
+const mock = new MockAdapter(axios);
+
+// Snapshot DEBUG so individual tests can toggle it and we always restore the
+// original value (the source gates secret-leaking branches on process.env.DEBUG).
+const ORIGINAL_DEBUG = process.env.DEBUG;
+
+afterEach(() => {
+  // Drop all registered handlers between tests.
+  mock.reset();
+  // Restore the env regardless of what a test set, to avoid cross-test leakage
+  // and to keep the developer's real DEBUG value intact after the run.
+  if (ORIGINAL_DEBUG === undefined) {
+    delete process.env.DEBUG;
+  } else {
+    process.env.DEBUG = ORIGINAL_DEBUG;
+  }
+});
+
+describe('getCollabToken', () => {
+  it('reads the token from the wrapped data.data.token path', async () => {
+    mock
+      .onPost(`${BASE_URL}/auth/collab-token`)
+      .reply(200, { data: { token: 'wrapped-token' } });
+
+    const token = await getCollabToken(BASE_URL, API_TOKEN);
+
+    expect(token).toBe('wrapped-token');
+  });
+
+  it('falls back to the top-level data.token when data.data is absent', async () => {
+    mock
+      .onPost(`${BASE_URL}/auth/collab-token`)
+      .reply(200, { token: 'flat-token' });
+
+    const token = await getCollabToken(BASE_URL, API_TOKEN);
+
+    expect(token).toBe('flat-token');
+  });
+
+  it('prefers data.data.token over a sibling top-level token', async () => {
+    mock
+      .onPost(`${BASE_URL}/auth/collab-token`)
+      .reply(200, { data: { token: 'wrapped' }, token: 'flat' });
+
+    const token = await getCollabToken(BASE_URL, API_TOKEN);
+
+    expect(token).toBe('wrapped');
+  });
+
+  it('sends the Bearer Authorization header built from the api token', async () => {
+    let seenAuth: string | undefined;
+    mock.onPost(`${BASE_URL}/auth/collab-token`).reply((config) => {
+      seenAuth = config.headers?.Authorization as string | undefined;
+      return [200, { data: { token: 'ok' } }];
+    });
+
+    await getCollabToken(BASE_URL, API_TOKEN);
+
+    expect(seenAuth).toBe(`Bearer ${API_TOKEN}`);
+  });
+
+  it('throws an Error whose .status carries the 401 so reauth callers can detect it', async () => {
+    // No DEBUG set: the body must NOT be leaked (see secret-leak guard test).
+    delete process.env.DEBUG;
+    mock
+      .onPost(`${BASE_URL}/auth/collab-token`)
+      .reply(401, { secret: 'do-not-leak' });
+
+    await expect(getCollabToken(BASE_URL, API_TOKEN)).rejects.toMatchObject({
+      status: 401,
+    });
+  });
+
+  it('omits the response body from the error message when DEBUG is unset (secret-leak guard)', async () => {
+    delete process.env.DEBUG;
+    mock
+      .onPost(`${BASE_URL}/auth/collab-token`)
+      .reply(401, { secret: 'do-not-leak' });
+
+    await expect(getCollabToken(BASE_URL, API_TOKEN)).rejects.toThrow(
+      /Failed to get collab token: 401/,
+    );
+    // The serialized body must be absent without DEBUG.
+    let captured: any;
+    try {
+      await getCollabToken(BASE_URL, API_TOKEN);
+    } catch (e) {
+      captured = e;
+    }
+    expect(captured.message).not.toContain('do-not-leak');
+    expect(captured.status).toBe(401);
+  });
+
+  it('includes the response body in the error message when DEBUG is set', async () => {
+    process.env.DEBUG = '1';
+    mock
+      .onPost(`${BASE_URL}/auth/collab-token`)
+      .reply(403, { detail: 'forbidden-detail' });
+
+    let captured: any;
+    try {
+      await getCollabToken(BASE_URL, API_TOKEN);
+    } catch (e) {
+      captured = e;
+    }
+    expect(captured.status).toBe(403);
+    // With DEBUG the JSON-serialized body is appended to the message.
+    expect(captured.message).toContain('forbidden-detail');
+    expect(captured.message).toContain('Failed to get collab token: 403');
+  });
+
+  it('rethrows a non-axios error unwrapped (status untouched)', async () => {
+    const boom = new Error('plain failure');
+    // A handler that throws a non-axios error from inside the request lifecycle.
+    mock.onPost(`${BASE_URL}/auth/collab-token`).reply(() => {
+      throw boom;
+    });
+
+    let captured: any;
+    try {
+      await getCollabToken(BASE_URL, API_TOKEN);
+    } catch (e) {
+      captured = e;
+    }
+    // It must be the exact same error object, not a wrapped one, and it must
+    // not have had a .status grafted onto it by the axios-error branch.
+    expect(captured).toBe(boom);
+    expect(captured.status).toBeUndefined();
+  });
+});
+
+describe('performLogin', () => {
+  it('extracts the authToken value from a single set-cookie header', async () => {
+    mock.onPost(`${BASE_URL}/auth/login`).reply(200, {}, {
+      'set-cookie': ['authToken=abc123; Path=/; HttpOnly'],
+    });
+
+    const token = await performLogin(BASE_URL, 'user@example.com', 'pw');
+
+    expect(token).toBe('abc123');
+  });
+
+  it('does not truncate a base64 cookie value containing "=" padding', async () => {
+    // The value contains "=" characters; slicing from the FIRST "=" must keep
+    // the full base64 payload (a naive split on "=" would lose the padding).
+    const value = 'eyJhbGciOiJIUzI1NiJ9.payload==';
+    mock.onPost(`${BASE_URL}/auth/login`).reply(200, {}, {
+      'set-cookie': [`authToken=${value}; Path=/; HttpOnly; SameSite=Lax`],
+    });
+
+    const token = await performLogin(BASE_URL, 'user@example.com', 'pw');
+
+    expect(token).toBe(value);
+  });
+
+  it('picks the authToken cookie out of multiple cookies present', async () => {
+    mock.onPost(`${BASE_URL}/auth/login`).reply(200, {}, {
+      'set-cookie': [
+        'sessionId=zzz; Path=/',
+        'authToken=the-token; Path=/; HttpOnly',
+        'theme=dark; Path=/',
+      ],
+    });
+
+    const token = await performLogin(BASE_URL, 'user@example.com', 'pw');
+
+    expect(token).toBe('the-token');
+  });
+
+  it('does NOT match authTokenRefresh (exact cookie-name guard)', async () => {
+    // Only an authTokenRefresh cookie is present; an exact-name match must
+    // reject it and report no authToken cookie rather than returning its value.
+    mock.onPost(`${BASE_URL}/auth/login`).reply(200, {}, {
+      'set-cookie': ['authTokenRefresh=refresh-value; Path=/; HttpOnly'],
+    });
+
+    await expect(
+      performLogin(BASE_URL, 'user@example.com', 'pw'),
+    ).rejects.toThrow('No authToken cookie found in login response');
+  });
+
+  it('prefers authToken over a co-present authTokenRefresh cookie', async () => {
+    mock.onPost(`${BASE_URL}/auth/login`).reply(200, {}, {
+      'set-cookie': [
+        'authTokenRefresh=refresh-value; Path=/',
+        'authToken=real-token; Path=/; HttpOnly',
+      ],
+    });
+
+    const token = await performLogin(BASE_URL, 'user@example.com', 'pw');
+
+    expect(token).toBe('real-token');
+  });
+
+  it('throws when the set-cookie header is missing', async () => {
+    // No set-cookie header at all in the response.
+    mock.onPost(`${BASE_URL}/auth/login`).reply(200, {});
+
+    await expect(
+      performLogin(BASE_URL, 'user@example.com', 'pw'),
+    ).rejects.toThrow('No Set-Cookie header found in login response');
+  });
+
+  describe('error logging (DEBUG gating)', () => {
+    let errorSpy: ReturnType<typeof vi.spyOn>;
+
+    beforeEach(() => {
+      errorSpy = vi.spyOn(console, 'error').mockImplementation(() => undefined);
+    });
+
+    afterEach(() => {
+      errorSpy.mockRestore();
+    });
+
+    it('logs only the status (not the body) on an axios error without DEBUG, and rethrows', async () => {
+      delete process.env.DEBUG;
+      mock
+        .onPost(`${BASE_URL}/auth/login`)
+        .reply(401, { secret: 'login-do-not-leak' });
+
+      await expect(
+        performLogin(BASE_URL, 'user@example.com', 'pw'),
+      ).rejects.toBeDefined();
+
+      const logged = errorSpy.mock.calls.flat();
+      // The body object must not be among the logged arguments.
+      expect(logged).toContain(401);
+      expect(
+        logged.some(
+          (a) =>
+            typeof a === 'object' &&
+            a !== null &&
+            (a as any).secret === 'login-do-not-leak',
+        ),
+      ).toBe(false);
+    });
+
+    it('logs the response body on an axios error when DEBUG is set, and rethrows', async () => {
+      process.env.DEBUG = '1';
+      mock
+        .onPost(`${BASE_URL}/auth/login`)
+        .reply(401, { detail: 'verbose-login-detail' });
+
+      await expect(
+        performLogin(BASE_URL, 'user@example.com', 'pw'),
+      ).rejects.toBeDefined();
+
+      const logged = errorSpy.mock.calls.flat();
+      expect(
+        logged.some(
+          (a) =>
+            typeof a === 'object' &&
+            a !== null &&
+            (a as any).detail === 'verbose-login-detail',
+        ),
+      ).toBe(true);
+    });
+  });
+});
--- a/test/client-pure.test.ts
+++ b/test/client-pure.test.ts
@@ -0,0 +1,474 @@
+// Unit tests for the PURE (private) helper methods of DocmostClient plus the
+// transformPage vm sandbox. The constructor only calls axios.create (no
+// network), so a real instance can be built and its private methods exercised
+// via an `(client as any)` cast. Private methods are pure (no I/O) except for
+// transformPage, whose network calls (ensureAuthenticated / listComments /
+// getPageRaw) we stub on the instance so the dryRun path runs offline.
+import { describe, it, expect } from 'vitest';
+import { DocmostClient } from '../packages/docmost-client/src/client.js';
+
+// Build a fresh client per test. The given URL ends with /api so appUrl tests
+// have something to strip; other tests do not depend on the suffix.
+function makeClient(apiUrl = 'https://docmost.example/api'): any {
+  return new DocmostClient(apiUrl, 'a@b.c', 'pw') as any;
+}
+
+describe('DocmostClient.isSafeUrl (SECURITY)', () => {
+  // --- dangerous schemes must be rejected in both contexts ---
+  const dangerousLink = ['javascript:alert(1)', 'vbscript:msgbox(1)', 'data:text/html,<script>'];
+  for (const url of dangerousLink) {
+    it(`rejects dangerous scheme on a link: ${url}`, () => {
+      const c = makeClient();
+      expect(c.isSafeUrl(url, 'link')).toBe(false);
+    });
+  }
+
+  // file: is in the dangerous set; for links scheme!==js/vbscript/data passes,
+  // BUT file: is only rejected for src. Confirm documented link behaviour:
+  // links only block javascript/vbscript/data. file: is allowed on a link.
+  it('allows file: on a link (links only block js/vbscript/data per docstring)', () => {
+    const c = makeClient();
+    expect(c.isSafeUrl('file:///etc/passwd', 'link')).toBe(true);
+  });
+
+  it('rejects file: on a src', () => {
+    const c = makeClient();
+    expect(c.isSafeUrl('file:///etc/passwd', 'src')).toBe(false);
+  });
+
+  it('rejects data: on a src', () => {
+    const c = makeClient();
+    expect(c.isSafeUrl('data:image/png;base64,AAAA', 'src')).toBe(false);
+  });
+
+  // --- whitespace / control-char smuggled schemes (the classic XSS bypass) ---
+  it('rejects a tab-smuggled javascript scheme on a link (java\\tscript:)', () => {
+    const c = makeClient();
+    const smuggled = 'java\tscript:alert(1)';
+    // CRITICAL: a bypass here would allow stored XSS. Must be rejected.
+    expect(c.isSafeUrl(smuggled, 'link')).toBe(false);
+  });
+
+  it('rejects a newline-smuggled javascript scheme on a link', () => {
+    const c = makeClient();
+    expect(c.isSafeUrl('java\nscript:alert(1)', 'link')).toBe(false);
+  });
+
+  it('rejects a leading-whitespace javascript scheme on a link', () => {
+    const c = makeClient();
+    expect(c.isSafeUrl('   javascript:alert(1)', 'link')).toBe(false);
+  });
+
+  it('rejects a NUL/control-char smuggled javascript scheme on a link', () => {
+    const c = makeClient();
+    // \x00 and \x01 are stripped before the scheme is parsed.
+    expect(c.isSafeUrl('java\x00script:alert(1)', 'link')).toBe(false);
+    expect(c.isSafeUrl('\x01javascript:alert(1)', 'link')).toBe(false);
+  });
+
+  it('rejects a tab-smuggled vbscript scheme on a src', () => {
+    const c = makeClient();
+    expect(c.isSafeUrl('vb\tscript:foo', 'src')).toBe(false);
+  });
+
+  // --- safe / allowed values ---
+  it('allows http and https in both contexts', () => {
+    const c = makeClient();
+    expect(c.isSafeUrl('http://example.com', 'link')).toBe(true);
+    expect(c.isSafeUrl('https://example.com', 'link')).toBe(true);
+    expect(c.isSafeUrl('http://example.com/x.png', 'src')).toBe(true);
+    expect(c.isSafeUrl('https://example.com/x.png', 'src')).toBe(true);
+  });
+
+  it('allows mailto in both contexts', () => {
+    const c = makeClient();
+    expect(c.isSafeUrl('mailto:a@b.c', 'link')).toBe(true);
+    expect(c.isSafeUrl('mailto:a@b.c', 'src')).toBe(true);
+  });
+
+  it('allows a scheme-less relative/absolute path (link and src)', () => {
+    const c = makeClient();
+    expect(c.isSafeUrl('/api/files/123/x.png', 'src')).toBe(true);
+    expect(c.isSafeUrl('relative/path', 'src')).toBe(true);
+    expect(c.isSafeUrl('#anchor', 'link')).toBe(true);
+    expect(c.isSafeUrl('/some/page', 'link')).toBe(true);
+  });
+
+  it('allows an arbitrary non-dangerous scheme on a link but not on a src', () => {
+    const c = makeClient();
+    // link: any scheme except js/vbscript/data is accepted (e.g. ftp, tel).
+    expect(c.isSafeUrl('ftp://host/file', 'link')).toBe(true);
+    expect(c.isSafeUrl('tel:+123', 'link')).toBe(true);
+    // src: only http/https/mailto (and scheme-less) are accepted.
+    expect(c.isSafeUrl('ftp://host/file', 'src')).toBe(false);
+    expect(c.isSafeUrl('tel:+123', 'src')).toBe(false);
+  });
+
+  // --- empty / non-string inputs ---
+  it('treats an empty/whitespace string as safe (empty href/src is harmless)', () => {
+    const c = makeClient();
+    expect(c.isSafeUrl('', 'link')).toBe(true);
+    expect(c.isSafeUrl('   ', 'src')).toBe(true);
+  });
+
+  it('rejects non-string inputs', () => {
+    const c = makeClient();
+    expect(c.isSafeUrl(undefined, 'link')).toBe(false);
+    expect(c.isSafeUrl(null, 'src')).toBe(false);
+    expect(c.isSafeUrl(123, 'link')).toBe(false);
+    expect(c.isSafeUrl({}, 'src')).toBe(false);
+  });
+});
+
+describe('DocmostClient.validateDocUrls', () => {
+  it('passes a clean doc with safe link href and safe media src', () => {
+    const c = makeClient();
+    const doc = {
+      type: 'doc',
+      content: [
+        {
+          type: 'paragraph',
+          content: [
+            { type: 'text', text: 'hi', marks: [{ type: 'link', attrs: { href: 'https://ok.com' } }] },
+          ],
+        },
+        { type: 'image', attrs: { src: '/api/files/1/x.png' } },
+      ],
+    };
+    expect(() => c.validateDocUrls(doc)).not.toThrow();
+  });
+
+  it('throws on an unsafe href on a link mark', () => {
+    const c = makeClient();
+    const doc = {
+      type: 'doc',
+      content: [
+        {
+          type: 'paragraph',
+          content: [
+            { type: 'text', text: 'x', marks: [{ type: 'link', attrs: { href: 'javascript:alert(1)' } }] },
+          ],
+        },
+      ],
+    };
+    expect(() => c.validateDocUrls(doc)).toThrow(/unsafe link href rejected/);
+  });
+
+  // Every media node type the method enumerates must have its src validated.
+  const mediaTypes = ['image', 'attachment', 'video', 'embed', 'youtube', 'drawio', 'excalidraw', 'audio', 'pdf'];
+  for (const type of mediaTypes) {
+    it(`throws on unsafe src on a ${type} node`, () => {
+      const c = makeClient();
+      const doc = { type: 'doc', content: [{ type, attrs: { src: 'javascript:alert(1)' } }] };
+      expect(() => c.validateDocUrls(doc)).toThrow(new RegExp(`unsafe ${type} src rejected`));
+    });
+
+    it(`throws on unsafe url on a ${type} node`, () => {
+      const c = makeClient();
+      const doc = { type: 'doc', content: [{ type, attrs: { url: 'data:text/html,x' } }] };
+      expect(() => c.validateDocUrls(doc)).toThrow(new RegExp(`unsafe ${type} url rejected`));
+    });
+  }
+
+  it('recurses into nested children', () => {
+    const c = makeClient();
+    const doc = {
+      type: 'doc',
+      content: [
+        { type: 'blockquote', content: [{ type: 'paragraph', content: [{ type: 'image', attrs: { src: 'vbscript:x' } }] }] },
+      ],
+    };
+    expect(() => c.validateDocUrls(doc)).toThrow(/unsafe image src rejected/);
+  });
+
+  it('throws when nesting exceeds the max depth (>200)', () => {
+    const c = makeClient();
+    // Build a chain 250 deep of content-wrapping nodes.
+    let node: any = { type: 'paragraph' };
+    for (let i = 0; i < 250; i++) node = { type: 'doc', content: [node] };
+    expect(() => c.validateDocUrls(node)).toThrow(/exceeds the maximum depth of 200/);
+  });
+
+  it('ignores non-object / null input without throwing', () => {
+    const c = makeClient();
+    expect(() => c.validateDocUrls(null)).not.toThrow();
+    expect(() => c.validateDocUrls('string')).not.toThrow();
+  });
+});
+
+describe('DocmostClient.validateDocStructure', () => {
+  it('passes a valid doc', () => {
+    const c = makeClient();
+    const doc = {
+      type: 'doc',
+      content: [{ type: 'paragraph', content: [{ type: 'text', text: 'hi', marks: [{ type: 'bold' }] }] }],
+    };
+    expect(() => c.validateDocStructure(doc)).not.toThrow();
+  });
+
+  it('throws when type is not a string (or node not an object)', () => {
+    const c = makeClient();
+    expect(() => c.validateDocStructure({ type: 123 })).toThrow(/string `type`/);
+    expect(() => c.validateDocStructure(null)).toThrow(/string `type`/);
+    expect(() => c.validateDocStructure('nope')).toThrow(/string `type`/);
+    expect(() => c.validateDocStructure({})).toThrow(/string `type`/);
+  });
+
+  it('throws when content is present but not an array', () => {
+    const c = makeClient();
+    expect(() => c.validateDocStructure({ type: 'doc', content: {} })).toThrow(/`content` must be an array/);
+  });
+
+  it('throws when marks is present but not an array', () => {
+    const c = makeClient();
+    expect(() => c.validateDocStructure({ type: 'paragraph', marks: 'bold' })).toThrow(/`marks` must be an array/);
+  });
+
+  it('throws when a mark is malformed (no string type)', () => {
+    const c = makeClient();
+    expect(() => c.validateDocStructure({ type: 'text', text: 'x', marks: [{ foo: 1 }] }))
+      .toThrow(/every mark must be an object with a string `type`/);
+  });
+
+  it('throws when a text node has a non-string text', () => {
+    const c = makeClient();
+    expect(() => c.validateDocStructure({ type: 'text', text: 123 })).toThrow(/text node must have a string `text`/);
+  });
+
+  it('throws when nesting exceeds the max depth (>200)', () => {
+    const c = makeClient();
+    let node: any = { type: 'paragraph' };
+    for (let i = 0; i < 250; i++) node = { type: 'doc', content: [node] };
+    expect(() => c.validateDocStructure(node)).toThrow(/nesting exceeds the maximum depth of 200/);
+  });
+});
+
+describe('DocmostClient.imageMimeFromPath', () => {
+  const cases: Array<[string, string]> = [
+    ['x.png', 'image/png'],
+    ['x.jpg', 'image/jpeg'],
+    ['x.jpeg', 'image/jpeg'],
+    ['x.gif', 'image/gif'],
+    ['x.webp', 'image/webp'],
+    ['x.svg', 'image/svg+xml'],
+  ];
+  for (const [path, mime] of cases) {
+    it(`maps ${path} -> ${mime}`, () => {
+      const c = makeClient();
+      expect(c.imageMimeFromPath(path)).toBe(mime);
+    });
+  }
+
+  it('is case-insensitive on the extension (.PNG)', () => {
+    const c = makeClient();
+    expect(c.imageMimeFromPath('/tmp/IMG.PNG')).toBe('image/png');
+    expect(c.imageMimeFromPath('/tmp/IMG.JpEg')).toBe('image/jpeg');
+  });
+
+  it('throws on an unknown extension', () => {
+    const c = makeClient();
+    expect(() => c.imageMimeFromPath('x.tiff')).toThrow(/unsupported image type/);
+  });
+
+  it('throws when there is no extension', () => {
+    const c = makeClient();
+    expect(() => c.imageMimeFromPath('/tmp/noext')).toThrow(/unsupported image type/);
+  });
+});
+
+describe('DocmostClient.buildImageNode', () => {
+  it('uses fileSize when present', () => {
+    const c = makeClient();
+    const node = c.buildImageNode({ id: 'abc', fileName: 'pic.png', fileSize: 4096 });
+    expect(node.type).toBe('image');
+    expect(node.attrs.size).toBe(4096);
+    expect(node.attrs.attachmentId).toBe('abc');
+    expect(node.attrs.src).toBe('/api/files/abc/pic.png');
+  });
+
+  it('defaults size to null when fileSize is undefined', () => {
+    const c = makeClient();
+    const node = c.buildImageNode({ id: 'abc', fileName: 'pic.png' });
+    expect(node.attrs.size).toBeNull();
+  });
+
+  it('defaults align to center and width to null', () => {
+    const c = makeClient();
+    const node = c.buildImageNode({ id: 'a', fileName: 'p.png' });
+    expect(node.attrs.align).toBe('center');
+    expect(node.attrs.width).toBeNull();
+  });
+
+  it('honours an explicit align', () => {
+    const c = makeClient();
+    const node = c.buildImageNode({ id: 'a', fileName: 'p.png' }, 'right');
+    expect(node.attrs.align).toBe('right');
+  });
+
+  it('omits alt when not provided, sets it when provided', () => {
+    const c = makeClient();
+    const noAlt = c.buildImageNode({ id: 'a', fileName: 'p.png' });
+    expect('alt' in noAlt.attrs).toBe(false);
+    const withAlt = c.buildImageNode({ id: 'a', fileName: 'p.png' }, 'center', 'a cat');
+    expect(withAlt.attrs.alt).toBe('a cat');
+  });
+});
+
+describe('DocmostClient.appUrl getter', () => {
+  it('strips a trailing /api', () => {
+    expect(makeClient('https://docmost.example/api').appUrl).toBe('https://docmost.example');
+  });
+
+  it('strips a trailing /api/', () => {
+    expect(makeClient('https://docmost.example/api/').appUrl).toBe('https://docmost.example');
+  });
+
+  it('leaves a non-/api URL intact', () => {
+    expect(makeClient('https://docmost.example').appUrl).toBe('https://docmost.example');
+    // /api in the middle of the path is not a trailing suffix, so untouched.
+    expect(makeClient('https://docmost.example/apidocs').appUrl).toBe('https://docmost.example/apidocs');
+  });
+});
+
+describe('DocmostClient.shareUrl', () => {
+  it('composes appUrl + share key + slugId', () => {
+    const c = makeClient('https://docmost.example/api');
+    expect(c.shareUrl('KEY123', 'slug-abc')).toBe('https://docmost.example/share/KEY123/p/slug-abc');
+  });
+
+  it('uses the stripped appUrl (no /api in the share URL)', () => {
+    const c = makeClient('https://docmost.example/api/');
+    expect(c.shareUrl('k', 's')).toBe('https://docmost.example/share/k/p/s');
+  });
+});
+
+describe('DocmostClient.parseCommentContent', () => {
+  it('parses a JSON string', () => {
+    const c = makeClient();
+    expect(c.parseCommentContent('{"type":"doc","content":[]}')).toEqual({ type: 'doc', content: [] });
+  });
+
+  it('passes a non-string value through unchanged', () => {
+    const c = makeClient();
+    const obj = { type: 'doc', content: [] };
+    expect(c.parseCommentContent(obj)).toBe(obj);
+    expect(c.parseCommentContent(null)).toBeNull();
+    expect(c.parseCommentContent(42)).toBe(42);
+  });
+
+  it('falls back to the raw string on invalid JSON', () => {
+    const c = makeClient();
+    expect(c.parseCommentContent('not json {')).toBe('not json {');
+  });
+});
+
+describe('DocmostClient.transformPage sandbox (dryRun, no socket)', () => {
+  // The dryRun path performs: ensureAuthenticated -> listComments -> getPageRaw
+  // -> runTransform (the vm sandbox) -> assertYjsEncodable -> diff. We stub the
+  // three network methods so the REAL sandbox runs offline. getPageRaw returns
+  // a minimal current doc; the transform operates on a structuredClone of it.
+  function stubbedClient(currentDoc: any = { type: 'doc', content: [{ type: 'paragraph' }] }): any {
+    const c = makeClient();
+    c.ensureAuthenticated = async () => {};
+    c.listComments = async () => [];
+    c.getPageRaw = async () => ({ content: currentDoc });
+    return c;
+  }
+
+  it('runs a transform that returns the doc and reports pushed:false in dryRun', async () => {
+    const c = stubbedClient();
+    const res = await c.transformPage('pid', '(doc, ctx) => doc', { dryRun: true });
+    expect(res.pushed).toBe(false);
+    expect(res).toHaveProperty('diff');
+    expect(Array.isArray(res.log)).toBe(true);
+  });
+
+  it('runs a transform that mutates the doc and the change shows in the diff', async () => {
+    const c = stubbedClient({ type: 'doc', content: [{ type: 'paragraph' }] });
+    const transform = `(doc) => { doc.content.push({ type: 'paragraph', content: [{ type: 'text', text: 'added' }] }); return doc; }`;
+    const res = await c.transformPage('pid', transform, { dryRun: true });
+    expect(res.pushed).toBe(false);
+    // diffDocs returns a non-empty diff when content changed.
+    expect(res.diff).toBeTruthy();
+  });
+
+  it('captures console.log output into the returned log array', async () => {
+    const c = stubbedClient();
+    const res = await c.transformPage('pid', `(doc) => { console.log('hello', 1); return doc; }`, { dryRun: true });
+    expect(res.log).toContain('hello 1');
+  });
+
+  it('sandbox has NO access to require/process/module/fs (they are undefined)', async () => {
+    const c = stubbedClient();
+    // The transform asserts these globals are undefined INSIDE the sandbox and
+    // throws if any leaked. If the transform completes, none leaked.
+    const transform = `(doc) => {
+      if (typeof require !== 'undefined') throw new Error('require leaked');
+      if (typeof process !== 'undefined') throw new Error('process leaked');
+      if (typeof module !== 'undefined') throw new Error('module leaked');
+      if (typeof global !== 'undefined') throw new Error('global leaked');
+      return doc;
+    }`;
+    await expect(c.transformPage('pid', transform, { dryRun: true })).resolves.toMatchObject({ pushed: false });
+  });
+
+  it('a transform that tries to require("fs") throws (no module loader in the sandbox)', async () => {
+    const c = stubbedClient();
+    const transform = `(doc) => { const fs = require('fs'); return doc; }`;
+    // require is not defined in the new context -> ReferenceError at run time.
+    await expect(c.transformPage('pid', transform, { dryRun: true })).rejects.toThrow();
+  });
+
+  it('throws when the transform does not evaluate to a function', async () => {
+    const c = stubbedClient();
+    await expect(c.transformPage('pid', '42', { dryRun: true }))
+      .rejects.toThrow(/must evaluate to a function/);
+  });
+
+  it('throws when the transform returns a non-doc value', async () => {
+    const c = stubbedClient();
+    await expect(c.transformPage('pid', '(doc) => ({ type: "paragraph" })', { dryRun: true }))
+      .rejects.toThrow(/must return a ProseMirror doc node/);
+    await expect(c.transformPage('pid', '(doc) => null', { dryRun: true }))
+      .rejects.toThrow(/must return a ProseMirror doc node/);
+  });
+
+  it('throws on a transform that does not compile', async () => {
+    const c = stubbedClient();
+    await expect(c.transformPage('pid', '(doc) => {{{', { dryRun: true }))
+      .rejects.toThrow(/did not compile/);
+  });
+
+  it('invokes validateDocStructure on the result (malformed node rejected)', async () => {
+    const c = stubbedClient();
+    // Return a doc whose child has a non-string type -> validateDocStructure throws.
+    const transform = `(doc) => ({ type: 'doc', content: [{ type: 123 }] })`;
+    await expect(c.transformPage('pid', transform, { dryRun: true }))
+      .rejects.toThrow(/string `type`/);
+  });
+
+  it('invokes validateDocUrls on the result (unsafe href rejected)', async () => {
+    const c = stubbedClient();
+    const transform = `(doc) => ({ type: 'doc', content: [
+      { type: 'paragraph', content: [
+        { type: 'text', text: 'x', marks: [{ type: 'link', attrs: { href: 'javascript:alert(1)' } }] }
+      ] }
+    ] })`;
+    await expect(c.transformPage('pid', transform, { dryRun: true }))
+      .rejects.toThrow(/unsafe link href rejected/);
+  });
+
+  it('enforces a vm wall-clock timeout (option present in source)', () => {
+    // Asserting the option rather than waiting 5s: the source sets
+    // { timeout: 5000 } on both runInNewContext calls. We verify the timeout
+    // literal exists in the compiled source so an accidental removal is caught.
+    // (Reading the source keeps this fast and avoids a real 5s busy loop.)
+    // eslint-disable-next-line @typescript-eslint/no-var-requires
+    const fs = require('node:fs');
+    const url = require('node:url');
+    const path = require('node:path');
+    const here = path.dirname(url.fileURLToPath(import.meta.url));
+    const src = fs.readFileSync(path.join(here, '..', 'packages', 'docmost-client', 'src', 'client.ts'), 'utf8');
+    expect(src).toMatch(/timeout:\s*5000/);
+  });
+});
--- a/test/client-rest.test.ts
+++ b/test/client-rest.test.ts
@@ -0,0 +1,618 @@
+import { afterEach, describe, expect, it, vi } from 'vitest';
+import axios from 'axios';
+import MockAdapter from 'axios-mock-adapter';
+// The DocmostClient source actually lives at packages/docmost-client/src/client.ts
+// (NOT under .../lib/). The package barrel re-exports it, and vitest resolves the
+// ".js" specifier to the TS source, so the real interceptors run.
+import { DocmostClient } from '../packages/docmost-client/src/client.js';
+
+/**
+ * Integration tests for DocmostClient's REST surface using axios-mock-adapter.
+ *
+ * Two distinct axios instances are in play and must each be mocked separately:
+ *
+ *   1. this.client (a dedicated axios.create() instance reachable via the
+ *      PRIVATE field (client as any).client). Every JSON REST call AND the
+ *      401/403 response interceptor live here. Attaching MockAdapter to THIS
+ *      instance is what makes the real interceptor run on mocked responses.
+ *
+ *   2. The global default `axios` import. performLogin() and getCollabToken()
+ *      (in lib/auth-utils.ts) use BARE axios.post(...), so /auth/login and
+ *      /auth/collab-token are NOT seen by this.client's interceptor and must be
+ *      mocked on the shared default axios instance instead (same trick the
+ *      existing auth-utils.test.ts relies on).
+ *
+ * Helper newClient() returns both the client and freshly-installed mocks; tests
+ * close over them. afterEach resets every mock and restores spies.
+ */
+
+const BASE_URL = 'https://docmost.example/api';
+
+// Track every mock created so afterEach can reset/restore them all even if a
+// test forgets — keeps handler registrations from leaking across tests.
+let activeMocks: MockAdapter[] = [];
+
+function instanceMock(client: DocmostClient): MockAdapter {
+  const m = new MockAdapter((client as any).client);
+  activeMocks.push(m);
+  return m;
+}
+
+function globalAxiosMock(): MockAdapter {
+  const m = new MockAdapter(axios);
+  activeMocks.push(m);
+  return m;
+}
+
+/**
+ * Register a /auth/login handler on the global-axios mock that always succeeds
+ * with a valid authToken set-cookie (this is how performLogin extracts a token).
+ * Returns a getter for how many times login was hit so re-login counts can be
+ * asserted.
+ */
+function stubLoginSuccess(gmock: MockAdapter): { get count(): number } {
+  let n = 0;
+  gmock.onPost(`${BASE_URL}/auth/login`).reply(() => {
+    n++;
+    return [200, {}, { 'set-cookie': ['authToken=token-' + n + '; Path=/; HttpOnly'] }];
+  });
+  return {
+    get count() {
+      return n;
+    },
+  };
+}
+
+afterEach(() => {
+  for (const m of activeMocks) m.restore();
+  activeMocks = [];
+  vi.restoreAllMocks();
+});
+
+// ---------------------------------------------------------------------------
+// paginateAll
+// ---------------------------------------------------------------------------
+describe('paginateAll', () => {
+  it('stops after a SHORT page (fewer items than the requested limit)', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    const gmock = globalAxiosMock();
+    stubLoginSuccess(gmock);
+    const imock = instanceMock(client);
+
+    let calls = 0;
+    imock.onPost('/items').reply((config) => {
+      calls++;
+      // Page 1 returns 3 items for a limit of 5 -> short page -> stop.
+      const body = JSON.parse(config.data);
+      expect(body.page).toBe(1);
+      return [200, { data: { items: [{ id: 'a' }, { id: 'b' }, { id: 'c' }] } }];
+    });
+
+    const out = await (client as any).paginateAll('/items', {}, 5);
+    expect(out.map((i: any) => i.id)).toEqual(['a', 'b', 'c']);
+    expect(calls).toBe(1); // never asked for page 2
+  });
+
+  it('stops on an EMPTY page', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    let calls = 0;
+    imock.onPost('/items').reply(() => {
+      calls++;
+      return [200, { data: { items: [] } }];
+    });
+
+    const out = await (client as any).paginateAll('/items', {}, 5);
+    expect(out).toEqual([]);
+    expect(calls).toBe(1);
+  });
+
+  it('follows meta.hasNextPage across multiple FULL pages', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    // Two full pages (limit 2) where the first declares hasNextPage:true and the
+    // second declares false; the second page is full but its flag stops the loop.
+    imock
+      .onPost('/items')
+      .replyOnce(200, {
+        data: { items: [{ id: '1' }, { id: '2' }], meta: { hasNextPage: true } },
+      })
+      .onPost('/items')
+      .replyOnce(200, {
+        data: { items: [{ id: '3' }, { id: '4' }], meta: { hasNextPage: false } },
+      });
+
+    const out = await (client as any).paginateAll('/items', {}, 2);
+    expect(out.map((i: any) => i.id)).toEqual(['1', '2', '3', '4']);
+  });
+
+  it('truncates at the MAX_PAGES cap and emits a console.warn', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+    const warn = vi.spyOn(console, 'warn').mockImplementation(() => undefined);
+
+    // A server that ALWAYS returns a full page (limit 1 -> 1 item) and always
+    // claims hasNextPage:true. The only stop condition is the 50-page ceiling.
+    let calls = 0;
+    imock.onPost('/items').reply(() => {
+      calls++;
+      return [200, { data: { items: [{ id: 'x' + calls }], meta: { hasNextPage: true } } }];
+    });
+
+    const out = await (client as any).paginateAll('/items', {}, 1);
+    // MAX_PAGES is 50: exactly 50 fetches, 50 accumulated items.
+    expect(calls).toBe(50);
+    expect(out).toHaveLength(50);
+    expect(warn).toHaveBeenCalledTimes(1);
+    expect(String(warn.mock.calls[0][0])).toContain('50-page cap');
+  });
+
+  it('clamps the limit into the 1..100 range before sending it', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    const seenLimits: number[] = [];
+    imock.onPost('/big').reply((config) => {
+      seenLimits.push(JSON.parse(config.data).limit);
+      return [200, { data: { items: [] } }];
+    });
+    imock.onPost('/small').reply((config) => {
+      seenLimits.push(JSON.parse(config.data).limit);
+      return [200, { data: { items: [] } }];
+    });
+
+    await (client as any).paginateAll('/big', {}, 9999); // clamps down to 100
+    await (client as any).paginateAll('/small', {}, 0); // clamps up to 1
+    expect(seenLimits).toEqual([100, 1]);
+  });
+
+  it('reads items from BOTH the data.data.items and the data.items envelope', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    // data.data.items envelope (wrapped).
+    imock.onPost('/wrapped').reply(200, { data: { items: [{ id: 'w' }] } });
+    // bare data.items envelope (unwrapped).
+    imock.onPost('/flat').reply(200, { items: [{ id: 'f' }] });
+
+    const wrapped = await (client as any).paginateAll('/wrapped', {}, 100);
+    const flat = await (client as any).paginateAll('/flat', {}, 100);
+    expect(wrapped.map((i: any) => i.id)).toEqual(['w']);
+    expect(flat.map((i: any) => i.id)).toEqual(['f']);
+  });
+
+  it('drives a real public method (getSpaces -> /spaces) through paginateAll + filterSpace', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    imock.onPost('/spaces').reply(200, {
+      data: {
+        items: [
+          { id: 's1', name: 'Space One', slug: 'one', extraneous: 'dropped' },
+        ],
+      },
+    });
+
+    const spaces = await client.getSpaces();
+    expect(spaces).toHaveLength(1);
+    expect(spaces[0]).toMatchObject({ id: 's1', name: 'Space One', slug: 'one' });
+    // filterSpace must drop fields it does not whitelist.
+    expect(spaces[0]).not.toHaveProperty('extraneous');
+  });
+});
+
+// ---------------------------------------------------------------------------
+// search
+// ---------------------------------------------------------------------------
+describe('search', () => {
+  it('clamps a too-large limit down to 100', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    let sentLimit: number | undefined;
+    imock.onPost('/search').reply((config) => {
+      sentLimit = JSON.parse(config.data).limit;
+      return [200, { data: [], success: true }];
+    });
+
+    await client.search('q', undefined, 9999);
+    expect(sentLimit).toBe(100);
+  });
+
+  it('clamps a too-small limit up to 1', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    let sentLimit: number | undefined;
+    imock.onPost('/search').reply((config) => {
+      sentLimit = JSON.parse(config.data).limit;
+      return [200, { data: [], success: true }];
+    });
+
+    await client.search('q', undefined, 0);
+    expect(sentLimit).toBe(1);
+  });
+
+  it('omits the limit field entirely when no limit is supplied', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    let body: any;
+    imock.onPost('/search').reply((config) => {
+      body = JSON.parse(config.data);
+      return [200, { data: [], success: true }];
+    });
+
+    await client.search('hello', 'space-1');
+    expect(body).not.toHaveProperty('limit');
+    expect(body.query).toBe('hello');
+    expect(body.spaceId).toBe('space-1');
+  });
+
+  it('normalizes a BARE-ARRAY data envelope', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    imock.onPost('/search').reply(200, {
+      data: [{ id: 'p1', title: 'Result 1', extra: 'x' }],
+      success: true,
+    });
+
+    const res = await client.search('q');
+    expect(res.success).toBe(true);
+    expect(res.items).toHaveLength(1);
+    expect(res.items[0]).toMatchObject({ id: 'p1', title: 'Result 1' });
+    // filterSearchResult whitelists fields; "extra" must be gone.
+    expect(res.items[0]).not.toHaveProperty('extra');
+  });
+
+  it('normalizes a { items: [...] } data envelope', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    imock.onPost('/search').reply(200, {
+      data: { items: [{ id: 'p2', title: 'Result 2' }] },
+      success: true,
+    });
+
+    const res = await client.search('q');
+    expect(res.items).toHaveLength(1);
+    expect(res.items[0]).toMatchObject({ id: 'p2', title: 'Result 2' });
+  });
+
+  it('defaults success to false when the envelope omits it', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    imock.onPost('/search').reply(200, { data: { items: [] } });
+
+    const res = await client.search('q');
+    expect(res.success).toBe(false);
+    expect(res.items).toEqual([]);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// listComments (cursor loop)
+// ---------------------------------------------------------------------------
+describe('listComments', () => {
+  it('loops on meta.nextCursor until it is null and concatenates every page', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    const seenCursors: (string | undefined)[] = [];
+    imock.onPost('/comments').reply((config) => {
+      const body = JSON.parse(config.data);
+      seenCursors.push(body.cursor);
+      if (!body.cursor) {
+        // First page: a nextCursor pushes the loop to a second request.
+        return [200, { data: { items: [{ id: 'c1' }], meta: { nextCursor: 'CUR2' } } }];
+      }
+      // Second page: nextCursor null -> loop terminates.
+      return [200, { data: { items: [{ id: 'c2' }], meta: { nextCursor: null } } }];
+    });
+
+    const comments = await client.listComments('page-1');
+    expect(comments.map((c: any) => c.id)).toEqual(['c1', 'c2']);
+    // First call carries no cursor; the second carries the server's nextCursor.
+    expect(seenCursors).toEqual([undefined, 'CUR2']);
+  });
+
+  it('parses stringified-JSON comment content into markdown per item', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    // createComment stores content as JSON.stringify(proseMirrorDoc); on read it
+    // comes back as a STRING that parseCommentContent must JSON.parse before the
+    // markdown converter can render it.
+    const stringifiedDoc = JSON.stringify({
+      type: 'doc',
+      content: [{ type: 'paragraph', content: [{ type: 'text', text: 'Hello comment' }] }],
+    });
+
+    imock.onPost('/comments').reply(200, {
+      data: {
+        items: [
+          { id: 'c1', pageId: 'page-1', content: stringifiedDoc },
+          { id: 'c2', pageId: 'page-1', content: '' }, // empty -> "" markdown
+        ],
+        meta: { nextCursor: null },
+      },
+    });
+
+    const comments = await client.listComments('page-1');
+    expect(comments[0].content).toContain('Hello comment');
+    expect(comments[1].content).toBe('');
+  });
+
+  it('handles the bare (unwrapped) response envelope too', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    // response.data.data is absent -> the code falls back to response.data.
+    imock.onPost('/comments').reply(200, {
+      items: [{ id: 'only', pageId: 'page-1', content: '' }],
+      meta: { nextCursor: null },
+    });
+
+    const comments = await client.listComments('page-1');
+    expect(comments.map((c: any) => c.id)).toEqual(['only']);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// checkNewComments
+// ---------------------------------------------------------------------------
+describe('checkNewComments', () => {
+  it('THROWS on an invalid "since" date rather than silently reporting nothing new', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    instanceMock(client);
+
+    await expect(client.checkNewComments('space-1', 'not-a-date')).rejects.toThrow(
+      /invalid "since" date/,
+    );
+  });
+
+  it('keeps only comments with createdAt STRICTLY greater than since (boundary excluded)', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    const since = '2026-06-16T10:00:00.000Z';
+
+    // One root page (no children) returned by sidebar-pages enumeration.
+    imock.onPost('/pages/sidebar-pages').reply(200, {
+      data: { items: [{ id: 'p1', title: 'Page 1', hasChildren: false }] },
+    });
+
+    // Comments on p1: one before, one exactly AT the boundary, one after.
+    imock.onPost('/comments').reply(200, {
+      data: {
+        items: [
+          { id: 'before', pageId: 'p1', content: '', createdAt: '2026-06-16T09:59:59.000Z' },
+          { id: 'equal', pageId: 'p1', content: '', createdAt: since }, // boundary -> excluded (> is strict)
+          { id: 'after', pageId: 'p1', content: '', createdAt: '2026-06-16T10:00:01.000Z' },
+        ],
+        meta: { nextCursor: null },
+      },
+    });
+
+    const res = await client.checkNewComments('space-1', since);
+    expect(res.totalNewComments).toBe(1);
+    expect(res.pagesWithNewComments).toBe(1);
+    expect(res.comments[0].comments.map((c: any) => c.id)).toEqual(['after']);
+    // The boundary-equal comment is NOT included.
+    expect(res.comments[0].comments.map((c: any) => c.id)).not.toContain('equal');
+  });
+
+  it('reports truncated=false for a small page set', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    imock.onPost('/pages/sidebar-pages').reply(200, {
+      data: { items: [{ id: 'p1', title: 'Page 1', hasChildren: false }] },
+    });
+    imock.onPost('/comments').reply(200, {
+      data: { items: [], meta: { nextCursor: null } },
+    });
+
+    const res = await client.checkNewComments('space-1', '2026-06-16T10:00:00.000Z');
+    expect(res.truncated).toBe(false);
+    expect(res.checkedPages).toBe(1);
+    expect(res.totalNewComments).toBe(0);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// AUTH: 401 interceptor + re-login dedup + getCollabTokenWithReauth
+// ---------------------------------------------------------------------------
+describe('auth: 401 interceptor and re-login', () => {
+  it('re-authenticates ONCE and replays the request ONCE on a 401-then-200 sequence', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    // Silence performLogin's own console.error noise (not under test here).
+    vi.spyOn(console, 'error').mockImplementation(() => undefined);
+    const gmock = globalAxiosMock();
+    const login = stubLoginSuccess(gmock);
+    const imock = instanceMock(client);
+
+    // Pre-authenticate so the very first ensureAuthenticated() login is already
+    // done; this isolates the count of EXTRA re-logins caused by the 401.
+    await client.login();
+    expect(login.count).toBe(1);
+
+    let getCalls = 0;
+    imock.onPost('/workspace/info').reply(() => {
+      getCalls++;
+      if (getCalls === 1) return [401, {}]; // expired token
+      return [200, { data: { id: 'ws-9', name: 'WS' }, success: true }];
+    });
+
+    const res = await client.getWorkspace();
+    expect(res.data.id).toBe('ws-9');
+    expect(getCalls).toBe(2); // original + exactly one replay
+    expect(login.count).toBe(2); // pre-auth + exactly one re-login
+  });
+
+  it('does NOT loop forever: a 401 on BOTH original and replay surfaces the error (config._retry guard)', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    vi.spyOn(console, 'error').mockImplementation(() => undefined);
+    const login = stubLoginSuccess(globalAxiosMock());
+    const imock = instanceMock(client);
+
+    await client.login();
+
+    let getCalls = 0;
+    imock.onPost('/workspace/info').reply(() => {
+      getCalls++;
+      return [401, {}]; // always 401, even after re-login
+    });
+
+    await expect(client.getWorkspace()).rejects.toBeDefined();
+    // The replay sets config._retry, so the SECOND 401 is not retried again.
+    expect(getCalls).toBe(2);
+    // Only one re-login happened (the first 401); the replay's 401 did not
+    // trigger another because _retry was already set.
+    expect(login.count).toBe(2);
+  });
+
+  it('never retries the /auth/login request itself through the interceptor', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    const imock = instanceMock(client);
+
+    // Route a /auth/login call THROUGH this.client (so the interceptor sees it)
+    // and have it 401: the isLoginRequest guard must prevent any replay loop.
+    let hits = 0;
+    imock.onPost('/auth/login').reply(() => {
+      hits++;
+      return [401, {}];
+    });
+
+    await expect((client as any).client.post('/auth/login', {})).rejects.toBeDefined();
+    expect(hits).toBe(1); // exactly one hit, no interceptor-driven retry
+  });
+
+  it('surfaces the ORIGINAL error when the re-login attempt itself fails', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    vi.spyOn(console, 'error').mockImplementation(() => undefined);
+    const gmock = globalAxiosMock();
+    // First login (pre-auth) succeeds; afterwards we flip login to fail.
+    let loginCalls = 0;
+    gmock.onPost(`${BASE_URL}/auth/login`).reply(() => {
+      loginCalls++;
+      if (loginCalls === 1) {
+        return [200, {}, { 'set-cookie': ['authToken=tok; Path=/'] }];
+      }
+      return [500, { msg: 'login down' }]; // re-login fails
+    });
+    const imock = instanceMock(client);
+
+    await client.login(); // pre-auth ok
+
+    imock.onPost('/workspace/info').reply(403, { msg: 'original-forbidden' });
+
+    let captured: any;
+    try {
+      await client.getWorkspace();
+    } catch (e) {
+      captured = e;
+    }
+    // The interceptor's catch returns Promise.reject(error) — the ORIGINAL 403,
+    // not the re-login's 500.
+    expect(captured?.response?.status).toBe(403);
+    expect(captured?.response?.data).toMatchObject({ msg: 'original-forbidden' });
+  });
+
+  it('dedups concurrent login() callers into ONE in-flight /auth/login request', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    const login = stubLoginSuccess(globalAxiosMock());
+
+    // Three simultaneous login() calls must collapse into a single request.
+    await Promise.all([client.login(), client.login(), client.login()]);
+    expect(login.count).toBe(1);
+    // loginPromise resets to null after the in-flight login settles.
+    expect((client as any).loginPromise).toBeNull();
+  });
+
+  it('resets loginPromise after a FAILED login so a later login can retry', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    vi.spyOn(console, 'error').mockImplementation(() => undefined);
+    const gmock = globalAxiosMock();
+
+    let loginCalls = 0;
+    gmock.onPost(`${BASE_URL}/auth/login`).reply(() => {
+      loginCalls++;
+      if (loginCalls === 1) return [500, {}]; // first attempt fails
+      return [200, {}, { 'set-cookie': ['authToken=ok; Path=/'] }]; // second succeeds
+    });
+
+    await expect(client.login()).rejects.toBeDefined();
+    // .finally() cleared the memoized promise even on failure.
+    expect((client as any).loginPromise).toBeNull();
+
+    // A fresh login() therefore issues a brand-new request instead of returning
+    // the previously-rejected promise.
+    await client.login();
+    expect(loginCalls).toBe(2);
+    expect((client as any).loginPromise).toBeNull();
+  });
+});
+
+describe('auth: getCollabTokenWithReauth', () => {
+  it('re-authenticates once on a 401 from collab-token, then retries and returns the token', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    vi.spyOn(console, 'error').mockImplementation(() => undefined);
+    const gmock = globalAxiosMock();
+    const login = stubLoginSuccess(gmock);
+    instanceMock(client);
+
+    let collabCalls = 0;
+    gmock.onPost(`${BASE_URL}/auth/collab-token`).reply(() => {
+      collabCalls++;
+      if (collabCalls === 1) return [401, {}]; // expired token
+      return [200, { data: { token: 'collab-good' } }];
+    });
+
+    const token = await (client as any).getCollabTokenWithReauth();
+    expect(token).toBe('collab-good');
+    expect(collabCalls).toBe(2); // original + retry
+    // ensureAuthenticated login (1) + re-login after the 401 (2).
+    expect(login.count).toBe(2);
+  });
+
+  it('rethrows a NON-auth collab-token error without retrying', async () => {
+    const client = new DocmostClient(BASE_URL, 'a@b.c', 'pw');
+    vi.spyOn(console, 'error').mockImplementation(() => undefined);
+    const gmock = globalAxiosMock();
+    const login = stubLoginSuccess(gmock);
+    instanceMock(client);
+
+    let collabCalls = 0;
+    gmock.onPost(`${BASE_URL}/auth/collab-token`).reply(() => {
+      collabCalls++;
+      return [500, { msg: 'server down' }]; // non-auth error
+    });
+
+    await expect((client as any).getCollabTokenWithReauth()).rejects.toBeDefined();
+    expect(collabCalls).toBe(1); // no retry on a non-auth error
+    expect(login.count).toBe(1); // only the initial ensureAuthenticated login
+  });
+});
--- a/test/client-upload.test.ts
+++ b/test/client-upload.test.ts
@@ -0,0 +1,323 @@
+// Security-guard tests for DocmostClient.uploadImage and DocmostClient.createPage.
+//
+// Both methods send multipart bodies via BARE default axios (`axios.post`)
+// rather than the per-instance client, because a FormData stream is single-use
+// and cannot be replayed by this.client's 401 response interceptor. They each
+// implement their own one-shot 401/403 re-auth that rebuilds the FormData.
+//
+// We therefore mock BOTH adapters:
+//   - the default `axios` (via `new MockAdapter(axios)`) for `/auth/login`,
+//     `/files/upload` and `/pages/import` (the bare multipart POSTs), and
+//   - the per-instance client (via `new MockAdapter((client as any).client)`)
+//     for the JSON endpoints `/pages/info`, `/pages/sidebar-pages`,
+//     `/pages/update`.
+//
+// For the filesystem we use REAL temp files written under os.tmpdir() so the
+// real statSync/readFileSync path is exercised (and cleaned up afterEach).
+
+import { describe, it, expect, beforeEach, afterEach } from 'vitest';
+import MockAdapter from 'axios-mock-adapter';
+import axios from 'axios';
+import { writeFileSync, mkdtempSync, rmSync, mkdirSync } from 'node:fs';
+import { join } from 'node:path';
+import { tmpdir } from 'node:os';
+import { DocmostClient } from '../packages/docmost-client/src/client.js';
+
+const API_URL = 'http://docmost.test/api';
+const SPACE_ID = 'space-1';
+const PAGE_ID = 'page-1';
+
+// A 1x1 transparent PNG (valid-ish bytes; content is irrelevant to the guards).
+const PNG_BYTES = Buffer.from(
+  '89504e470d0a1a0a0000000d49484452000000010000000108060000001f15c4890000000a49444154789c63000100000500010d0a2db40000000049454e44ae426082',
+  'hex',
+);
+
+// A login mock that satisfies performLogin(): it reads the authToken cookie
+// from the Set-Cookie header. Returns it as an array, as a real server would.
+function mockLogin(mockAxios: MockAdapter): void {
+  mockAxios.onPost(`${API_URL}/auth/login`).reply(200, {}, {
+    'set-cookie': ['authToken=test-jwt-token; HttpOnly; Path=/'],
+  });
+}
+
+describe('DocmostClient multipart security guards', () => {
+  let tmpDir: string;
+  let mockAxios: MockAdapter; // default axios -> bare multipart + login
+  let mockClient: MockAdapter; // per-instance client -> JSON endpoints
+  let client: DocmostClient;
+
+  beforeEach(() => {
+    tmpDir = mkdtempSync(join(tmpdir(), 'docmost-upload-test-'));
+    client = new DocmostClient(API_URL, 'user@test', 'pw');
+    mockAxios = new MockAdapter(axios);
+    mockClient = new MockAdapter((client as any).client);
+    mockLogin(mockAxios);
+  });
+
+  afterEach(() => {
+    mockAxios.restore();
+    mockClient.restore();
+    delete process.env.DEBUG;
+    rmSync(tmpDir, { recursive: true, force: true });
+  });
+
+  // Helper: write a real image fixture and return its absolute path.
+  function writeImage(name: string, bytes: Buffer = PNG_BYTES): string {
+    const p = join(tmpDir, name);
+    writeFileSync(p, bytes);
+    return p;
+  }
+
+  describe('uploadImage — host-fs trust boundary', () => {
+    it('rejects an unsupported extension BEFORE any stat/read', async () => {
+      // Point at a path that does NOT exist on disk. If the extension guard
+      // runs first (as it must), we get the "unsupported image type" error and
+      // never reach statSync — which would otherwise throw a "Cannot stat"
+      // error. The error message proves the guard order.
+      const badPath = join(tmpDir, 'does-not-exist.txt');
+      await expect(client.uploadImage(PAGE_ID, badPath)).rejects.toThrow(
+        /unsupported image type \.txt; supported: png, jpg, jpeg, gif, webp, svg/,
+      );
+    });
+
+    it('reports "(none)" for a path with no extension (still before stat)', async () => {
+      const noExt = join(tmpDir, 'noextension');
+      await expect(client.uploadImage(PAGE_ID, noExt)).rejects.toThrow(
+        /unsupported image type \(none\)/,
+      );
+    });
+
+    it('rejects a directory (non-regular file) after the extension passes', async () => {
+      // A directory whose name ends in .png passes the extension allowlist but
+      // must fail the stat.isFile() guard.
+      const dirPath = join(tmpDir, 'a-directory.png');
+      mkdirSync(dirPath);
+      await expect(client.uploadImage(PAGE_ID, dirPath)).rejects.toThrow(
+        new RegExp(`Not a regular file: "${dirPath.replace(/[.*+?^${}()|[\]\\]/g, '\\$&')}"`),
+      );
+    });
+
+    it('surfaces a stat failure for a missing supported-extension file', async () => {
+      // Extension is valid, but the file does not exist -> statSync throws and
+      // is wrapped in "Cannot stat image file ...".
+      const missing = join(tmpDir, 'missing.png');
+      await expect(client.uploadImage(PAGE_ID, missing)).rejects.toThrow(
+        /Cannot stat image file at ".*missing\.png": /,
+      );
+    });
+
+    it('rejects a file larger than the 20 MiB cap', async () => {
+      // Write a real file just over 20 MiB so the real statSync size path is
+      // exercised. 20 MiB == 20 * 1024 * 1024; one extra byte trips the cap.
+      const MAX = 20 * 1024 * 1024;
+      const bigPath = join(tmpDir, 'big.png');
+      writeFileSync(bigPath, Buffer.alloc(MAX + 1));
+      await expect(client.uploadImage(PAGE_ID, bigPath)).rejects.toThrow(
+        new RegExp(`Image too large: ${MAX + 1} bytes exceeds the ${MAX}-byte cap`),
+      );
+      // No multipart POST should have been attempted for an oversized file.
+      const uploadPosts = mockAxios.history.post.filter((r) =>
+        String(r.url).includes('/files/upload'),
+      );
+      expect(uploadPosts.length).toBe(0);
+    });
+
+    it('uploads a valid image and returns attachment metadata + image node', async () => {
+      const imgPath = writeImage('ok.png');
+      mockAxios.onPost(`${API_URL}/files/upload`).reply(200, {
+        data: { id: 'att-1', fileName: 'ok.png', fileSize: 1234 },
+      });
+
+      const res = await client.uploadImage(PAGE_ID, imgPath);
+      expect(res.attachmentId).toBe('att-1');
+      expect(res.fileName).toBe('ok.png');
+      expect(res.fileSize).toBe(1234);
+      expect(res.src).toBe('/api/files/att-1/ok.png');
+      expect(res.imageNode.type).toBe('image');
+      expect(res.imageNode.attrs.attachmentId).toBe('att-1');
+      expect(res.imageNode.attrs.size).toBe(1234);
+    });
+
+    it('falls back to the local stat size when the response omits fileSize', async () => {
+      const imgPath = writeImage('nosize.png'); // PNG_BYTES length
+      const expectedSize = PNG_BYTES.length;
+      mockAxios.onPost(`${API_URL}/files/upload`).reply(200, {
+        // No fileSize in the attachment payload.
+        data: { id: 'att-2', fileName: 'nosize.png' },
+      });
+
+      const res = await client.uploadImage(PAGE_ID, imgPath);
+      expect(res.fileSize).toBe(expectedSize);
+      // The image node's size attr also uses the resolved (local) size.
+      expect(res.imageNode.attrs.size).toBe(expectedSize);
+    });
+
+    it('rebuilds a FRESH FormData and retries exactly once on a 401', async () => {
+      const imgPath = writeImage('retry.png');
+      // First multipart POST -> 401; second -> 200. login() is also issued
+      // between the two by the re-auth branch (already mocked by mockLogin).
+      mockAxios
+        .onPost(`${API_URL}/files/upload`)
+        .replyOnce(401)
+        .onPost(`${API_URL}/files/upload`)
+        .replyOnce(200, { data: { id: 'att-3', fileName: 'retry.png', fileSize: 7 } });
+
+      const res = await client.uploadImage(PAGE_ID, imgPath);
+      expect(res.attachmentId).toBe('att-3');
+
+      // Exactly two upload POSTs (the original + one retry), and a fresh login
+      // was triggered in between.
+      const uploadPosts = mockAxios.history.post.filter((r) =>
+        String(r.url).includes('/files/upload'),
+      );
+      expect(uploadPosts.length).toBe(2);
+      const loginPosts = mockAxios.history.post.filter((r) =>
+        String(r.url).includes('/auth/login'),
+      );
+      // One initial ensureAuthenticated() login + one re-auth login.
+      expect(loginPosts.length).toBeGreaterThanOrEqual(1);
+    });
+
+    it('does NOT retry more than once on repeated 401s', async () => {
+      const imgPath = writeImage('always401.png');
+      // Every upload POST returns 401. After the single retry also 401s, the
+      // error must propagate (no infinite loop). The second 401 is a raw
+      // AxiosError thrown out of the retry branch (not re-caught).
+      mockAxios.onPost(`${API_URL}/files/upload`).reply(401);
+
+      await expect(client.uploadImage(PAGE_ID, imgPath)).rejects.toBeTruthy();
+      const uploadPosts = mockAxios.history.post.filter((r) =>
+        String(r.url).includes('/files/upload'),
+      );
+      // Exactly two attempts: original + one retry.
+      expect(uploadPosts.length).toBe(2);
+    });
+
+    it('sanitizes a non-auth AxiosError and does NOT leak the response body', async () => {
+      const imgPath = writeImage('leak.png');
+      const SECRET = 'SUPER_SECRET_TOKEN_abc123';
+      mockAxios.onPost(`${API_URL}/files/upload`).reply(500, {
+        message: SECRET,
+        internal: { stack: SECRET },
+      });
+
+      let caught: Error | undefined;
+      try {
+        await client.uploadImage(PAGE_ID, imgPath);
+      } catch (e) {
+        caught = e as Error;
+      }
+      expect(caught).toBeDefined();
+      // Surfaces only status/statusText, never the body.
+      expect(caught!.message).toMatch(/Image upload failed: 500/);
+      expect(caught!.message).not.toContain(SECRET);
+    });
+
+    it('throws on a response missing att.id', async () => {
+      const imgPath = writeImage('noid.png');
+      mockAxios.onPost(`${API_URL}/files/upload`).reply(200, {
+        data: { fileName: 'noid.png' }, // missing id
+      });
+      await expect(client.uploadImage(PAGE_ID, imgPath)).rejects.toThrow(
+        /Unexpected \/files\/upload response:/,
+      );
+    });
+
+    it('throws on a response missing att.fileName', async () => {
+      const imgPath = writeImage('noname.png');
+      mockAxios.onPost(`${API_URL}/files/upload`).reply(200, {
+        data: { id: 'att-x' }, // missing fileName
+      });
+      await expect(client.uploadImage(PAGE_ID, imgPath)).rejects.toThrow(
+        /Unexpected \/files\/upload response:/,
+      );
+    });
+  });
+
+  describe('createPage — multipart import guards', () => {
+    it('rejects when the parent page is not found', async () => {
+      // getPage(parentPageId) -> getPageRaw -> POST /pages/info. Make it 404 so
+      // getPage throws and createPage maps it to the parent-not-found error.
+      mockClient.onPost('/pages/info').reply(404, { message: 'nope' });
+
+      await expect(
+        client.createPage('Title', '# body', SPACE_ID, 'missing-parent'),
+      ).rejects.toThrow('Parent page with ID missing-parent not found.');
+
+      // No import POST should have happened — the parent check runs first.
+      const importPosts = mockAxios.history.post.filter((r) =>
+        String(r.url).includes('/pages/import'),
+      );
+      expect(importPosts.length).toBe(0);
+    });
+
+    it('creates a page (no parent) and re-sets the title after import', async () => {
+      // Import succeeds via bare axios.
+      mockAxios
+        .onPost(`${API_URL}/pages/import`)
+        .reply(200, { data: { id: 'new-page-1' } });
+      // Title restore goes through the per-instance client.
+      mockClient.onPost('/pages/update').reply(200, { data: { ok: true } });
+      // Final getPage(newPageId): /pages/info + /pages/sidebar-pages.
+      mockClient
+        .onPost('/pages/info')
+        .reply(200, {
+          data: { id: 'new-page-1', spaceId: SPACE_ID, title: 'My Title', content: null },
+        });
+      mockClient
+        .onPost('/pages/sidebar-pages')
+        .reply(200, { data: { items: [], meta: { hasNextPage: false } } });
+
+      const res = await client.createPage('My Title', '# body', SPACE_ID);
+      expect((res as any).success).toBe(true);
+
+      // The title was re-set via /pages/update with the exact (un-mangled) title.
+      const updatePosts = mockClient.history.post.filter((r) =>
+        String(r.url).includes('/pages/update'),
+      );
+      expect(updatePosts.length).toBe(1);
+      const body = JSON.parse(String(updatePosts[0].data));
+      expect(body).toMatchObject({ pageId: 'new-page-1', title: 'My Title' });
+    });
+
+    it('rebuilds FormData and retries the import exactly once on a 401', async () => {
+      mockAxios
+        .onPost(`${API_URL}/pages/import`)
+        .replyOnce(401)
+        .onPost(`${API_URL}/pages/import`)
+        .replyOnce(200, { data: { id: 'new-page-2' } });
+      mockClient.onPost('/pages/update').reply(200, { data: { ok: true } });
+      mockClient
+        .onPost('/pages/info')
+        .reply(200, {
+          data: { id: 'new-page-2', spaceId: SPACE_ID, title: 'T', content: null },
+        });
+      mockClient
+        .onPost('/pages/sidebar-pages')
+        .reply(200, { data: { items: [], meta: { hasNextPage: false } } });
+
+      const res = await client.createPage('T', '# body', SPACE_ID);
+      expect((res as any).success).toBe(true);
+
+      const importPosts = mockAxios.history.post.filter((r) =>
+        String(r.url).includes('/pages/import'),
+      );
+      expect(importPosts.length).toBe(2);
+    });
+
+    it('rethrows a non-auth import error without retrying', async () => {
+      mockAxios.onPost(`${API_URL}/pages/import`).reply(500, { message: 'boom' });
+
+      await expect(
+        client.createPage('T', '# body', SPACE_ID),
+      ).rejects.toBeTruthy();
+
+      const importPosts = mockAxios.history.post.filter((r) =>
+        String(r.url).includes('/pages/import'),
+      );
+      // Exactly one attempt: a non-401/403 error is rethrown, never retried.
+      expect(importPosts.length).toBe(1);
+    });
+  });
+});
--- a/test/collaboration-mutate.test.ts
+++ b/test/collaboration-mutate.test.ts
@@ -0,0 +1,478 @@
+import { afterEach, beforeEach, describe, expect, it, vi } from 'vitest';
+import * as Y from 'yjs';
+
+// -----------------------------------------------------------------------------
+// Mock the Hocuspocus provider so the test drives its whole lifecycle by hand.
+//
+// `mutatePageContent` constructs `new HocuspocusProvider({...})` and wires all
+// behaviour through callbacks on the OPTIONS object it passes in:
+//   onConnect / onDisconnect / onClose / onSynced / onAuthenticationFailed.
+// It does NOT use an `onUnsyncedChanges` option — instead it reads the live
+// `provider.unsyncedChanges` getter and subscribes via
+// `provider.on("unsyncedChanges", handler)` / `provider.off(...)`.
+//
+// The mock therefore:
+//   - records EVERY constructed instance (so a test can assert "not called");
+//   - captures the options object (to fire onSynced/onDisconnect/onClose/...);
+//   - exposes the real `Y.Doc` passed as `options.document` — the source reads
+//     and writes THAT doc (a closure variable), never `provider.document`, so
+//     reading the fragment off the captured doc reflects what was written;
+//   - implements `on`/`off` for the "unsyncedChanges" event, a settable
+//     `unsyncedChanges` getter-backed field, and no-op `destroy`/`disconnect`.
+// -----------------------------------------------------------------------------
+
+type UnsyncedHandler = (data: { number: number }) => void;
+
+interface MockProviderHandle {
+  opts: any;
+  ydoc: Y.Doc;
+  unsyncedChanges: number;
+  listeners: Map<string, Set<(...args: any[]) => void>>;
+  destroyed: boolean;
+  // Helpers to drive the lifecycle from a test.
+  fireSynced: () => void;
+  fireDisconnect: () => void;
+  fireClose: () => void;
+  fireAuthFailed: () => void;
+  fireConnect: () => void;
+  // Set unsyncedChanges and emit the "unsyncedChanges" event with the new value.
+  emitUnsynced: (n: number) => void;
+}
+
+// Shared registry the test reads after invoking the SUT.
+const instances: MockProviderHandle[] = [];
+
+vi.mock('@hocuspocus/provider', () => {
+  const HocuspocusProvider = vi.fn().mockImplementation((opts: any) => {
+    const listeners = new Map<string, Set<(...args: any[]) => void>>();
+    const handle: MockProviderHandle = {
+      opts,
+      ydoc: opts.document as Y.Doc,
+      unsyncedChanges: 1, // default: write is outstanding until told otherwise
+      listeners,
+      destroyed: false,
+      fireSynced: () => opts.onSynced && opts.onSynced(),
+      fireDisconnect: () => opts.onDisconnect && opts.onDisconnect(),
+      fireClose: () => opts.onClose && opts.onClose(),
+      fireAuthFailed: () =>
+        opts.onAuthenticationFailed && opts.onAuthenticationFailed(),
+      fireConnect: () => opts.onConnect && opts.onConnect(),
+      emitUnsynced: (n: number) => {
+        handle.unsyncedChanges = n;
+        const set = listeners.get('unsyncedChanges');
+        if (set) for (const fn of set) fn({ number: n });
+      },
+    };
+
+    // The object the SUT actually interacts with.
+    const provider: any = {
+      // `unsyncedChanges` is read synchronously by waitForPersistence; back it
+      // by the handle so a test can preset it before firing onSynced.
+      get unsyncedChanges() {
+        return handle.unsyncedChanges;
+      },
+      on: (event: string, fn: (...args: any[]) => void) => {
+        if (!listeners.has(event)) listeners.set(event, new Set());
+        listeners.get(event)!.add(fn);
+      },
+      off: (event: string, fn: (...args: any[]) => void) => {
+        listeners.get(event)?.delete(fn);
+      },
+      destroy: () => {
+        handle.destroyed = true;
+      },
+      disconnect: () => {},
+      document: opts.document,
+    };
+
+    // Let a test reach the provider object too, if needed.
+    (handle as any).provider = provider;
+    instances.push(handle);
+    return provider;
+  });
+  return { HocuspocusProvider };
+});
+
+// Import AFTER vi.mock so the mocked provider is in place. Import directly from
+// the source .js (matches the repo's other tests, e.g. page-lock.test.ts).
+import {
+  mutatePageContent,
+  replacePageContent,
+} from '../packages/docmost-client/src/lib/collaboration.js';
+import { HocuspocusProvider } from '@hocuspocus/provider';
+
+// A valid minimal ProseMirror doc used as the "new" content to write.
+function newDocWith(text: string) {
+  return {
+    type: 'doc',
+    content: [
+      {
+        type: 'paragraph',
+        content: [{ type: 'text', text }],
+      },
+    ],
+  };
+}
+
+// Read the "default" XML fragment off a Y.Doc and report whether it has nodes.
+function fragmentLength(ydoc: Y.Doc): number {
+  return ydoc.getXmlFragment('default').length;
+}
+
+// Flush pending microtasks so callbacks fired synchronously settle before the
+// test inspects results. withPageLock chains through several microtask hops.
+async function flushMicrotasks() {
+  for (let i = 0; i < 20; i++) await Promise.resolve();
+}
+
+// Drive the SUT: call mutatePageContent, wait for the provider to be built,
+// run `drive(handle)` to fire lifecycle callbacks, then await the result.
+async function runMutate(
+  transform: (live: any) => any,
+  drive: (handle: MockProviderHandle) => void | Promise<void>,
+  pageId = uniquePageId(),
+) {
+  const promise = mutatePageContent(pageId, 'collab-token', 'http://x/api', transform);
+  // The provider is constructed only AFTER the page lock grants the turn,
+  // which is a few microtask hops in. Wait until the instance shows up.
+  await flushMicrotasks();
+  const handle = instances[instances.length - 1];
+  expect(handle, 'provider should have been constructed').toBeTruthy();
+  await drive(handle);
+  await flushMicrotasks();
+  return promise;
+}
+
+// Unique pageId per test: the page lock is keyed by a process-global Map, so a
+// reused id would serialize unrelated tests behind each other.
+let pageCounter = 0;
+function uniquePageId() {
+  return `page-${process.pid}-${Date.now()}-${pageCounter++}`;
+}
+
+beforeEach(() => {
+  vi.useFakeTimers();
+  instances.length = 0;
+});
+
+afterEach(() => {
+  vi.useRealTimers();
+  vi.clearAllMocks();
+});
+
+describe('replacePageContent — fail-fast guard (before any provider)', () => {
+  it('throws on null document WITHOUT constructing a provider', async () => {
+    await expect(
+      replacePageContent('p1', null as any, 'tok', 'http://x/api'),
+    ).rejects.toThrow(/invalid ProseMirror document/);
+    // The guard runs before mutatePageContent, so no provider is built.
+    expect(HocuspocusProvider).not.toHaveBeenCalled();
+    expect(instances.length).toBe(0);
+  });
+
+  it('throws on a non-"doc"-typed object WITHOUT constructing a provider', async () => {
+    await expect(
+      replacePageContent(
+        'p2',
+        { type: 'paragraph', content: [] } as any,
+        'tok',
+        'http://x/api',
+      ),
+    ).rejects.toThrow(/invalid ProseMirror document/);
+    expect(HocuspocusProvider).not.toHaveBeenCalled();
+    expect(instances.length).toBe(0);
+  });
+
+  it('throws on a non-object (string) WITHOUT constructing a provider', async () => {
+    await expect(
+      replacePageContent('p3', 'just a string' as any, 'tok', 'http://x/api'),
+    ).rejects.toThrow(/invalid ProseMirror document/);
+    expect(HocuspocusProvider).not.toHaveBeenCalled();
+    expect(instances.length).toBe(0);
+  });
+});
+
+describe('mutatePageContent — read/transform/write core', () => {
+  it('transform receives the default empty doc when the live Y.Doc is empty', async () => {
+    let received: any;
+    const promise = await runMutate(
+      (live) => {
+        received = live;
+        return null; // abort: we only care about what the transform saw
+      },
+      (h) => {
+        // Empty live doc -> onSynced reads it and runs the transform.
+        h.fireSynced();
+      },
+    );
+    await promise;
+    // An empty fragment yields the synthesized default doc.
+    expect(received).toEqual({ type: 'doc', content: [] });
+  });
+
+  it('transform returning null performs NO write and resolves with the live doc', async () => {
+    let liveDocRef: any;
+    const promise = await runMutate(
+      (live) => {
+        liveDocRef = live;
+        return null;
+      },
+      (h) => h.fireSynced(),
+    );
+    const result = await promise;
+    // No write: the captured Y.Doc fragment is still empty.
+    const handle = instances[instances.length - 1];
+    expect(fragmentLength(handle.ydoc)).toBe(0);
+    // The returned value is the live doc (the default empty doc here).
+    expect(result).toBe(liveDocRef);
+    expect(result).toEqual({ type: 'doc', content: [] });
+  });
+
+  it('transform throwing propagates: the returned promise rejects', async () => {
+    const pageId = uniquePageId();
+    const promise = mutatePageContent(pageId, 'tok', 'http://x/api', () => {
+      throw new Error('boom from transform');
+    });
+    // Attach the rejection handler up-front so the rejection is observed even
+    // though the throw is surfaced synchronously inside the SUT's onSynced
+    // try/catch (which converts it into a finish()/reject()).
+    const settled = promise.then(
+      () => ({ ok: true as const }),
+      (err: Error) => ({ ok: false as const, err }),
+    );
+    await flushMicrotasks();
+    const handle = instances[instances.length - 1];
+    handle.fireSynced();
+    await flushMicrotasks();
+    const outcome = await settled;
+    expect(outcome.ok).toBe(false);
+    if (!outcome.ok) {
+      expect(outcome.err.message).toMatch(/boom from transform/);
+    }
+  });
+
+  it('transform returning a new doc replaces the fragment (old gone, new present)', async () => {
+    const pageId = uniquePageId();
+    const promise = mutatePageContent(
+      pageId,
+      'tok',
+      'http://x/api',
+      () => newDocWith('hello world'),
+    );
+    await flushMicrotasks();
+    const handle = instances[instances.length - 1];
+    expect(handle).toBeTruthy();
+
+    // Seed the live doc with some pre-existing content so we can prove it is
+    // fully replaced (not merged). We write a paragraph into the fragment that
+    // the SUT will read on sync, then clear+rewrite.
+    const liveFragment = handle.ydoc.getXmlFragment('default');
+    handle.ydoc.transact(() => {
+      const el = new Y.XmlElement('paragraph');
+      el.insert(0, [new Y.XmlText('OLD CONTENT')]);
+      liveFragment.insert(0, [el]);
+    });
+    expect(fragmentLength(handle.ydoc)).toBe(1);
+
+    // Fire sync: the SUT reads liveDoc, runs transform, deletes the fragment,
+    // and applies the new doc's update.
+    handle.fireSynced();
+    // The write is synchronous; persistence is still pending (unsyncedChanges=1).
+    await flushMicrotasks();
+
+    // The fragment now reflects the NEW doc. The old "OLD CONTENT" text is gone.
+    const xml = handle.ydoc.getXmlFragment('default').toString();
+    expect(xml).toContain('hello world');
+    expect(xml).not.toContain('OLD CONTENT');
+
+    // Now acknowledge persistence so the promise resolves cleanly.
+    handle.emitUnsynced(0);
+    await flushMicrotasks();
+    const result = await promise;
+    expect(result).toEqual(newDocWith('hello world'));
+  });
+});
+
+describe('mutatePageContent — persistence / false-success suppression', () => {
+  it('unsyncedChanges->0 while connected RESOLVES with the written doc', async () => {
+    const pageId = uniquePageId();
+    const promise = mutatePageContent(
+      pageId,
+      'tok',
+      'http://x/api',
+      () => newDocWith('persisted'),
+    );
+    await flushMicrotasks();
+    const handle = instances[instances.length - 1];
+    // Outstanding write at sync time (unsyncedChanges defaults to 1), so the
+    // SUT subscribes and waits for the event.
+    handle.fireSynced();
+    await flushMicrotasks();
+
+    // Server acknowledges: counter drops to 0 while still connected.
+    handle.emitUnsynced(0);
+    await flushMicrotasks();
+    const result = await promise;
+    expect(result).toEqual(newDocWith('persisted'));
+  });
+
+  it('resolves immediately when unsyncedChanges is already 0 at persist-check time', async () => {
+    const pageId = uniquePageId();
+    const promise = mutatePageContent(
+      pageId,
+      'tok',
+      'http://x/api',
+      () => newDocWith('already synced'),
+    );
+    await flushMicrotasks();
+    const handle = instances[instances.length - 1];
+    // Pretend the write was acknowledged before waitForPersistence checks.
+    handle.unsyncedChanges = 0;
+    handle.fireSynced();
+    await flushMicrotasks();
+    const result = await promise;
+    expect(result).toEqual(newDocWith('already synced'));
+  });
+
+  it('disconnect BEFORE reaching 0 unsynced does NOT resolve as success (connectionLost guard)', async () => {
+    const pageId = uniquePageId();
+    const promise = mutatePageContent(
+      pageId,
+      'tok',
+      'http://x/api',
+      () => newDocWith('should not persist'),
+    );
+    // Reject handler attached up-front so the rejection is never unhandled.
+    const settled = promise.then(
+      () => ({ ok: true as const }),
+      (err: Error) => ({ ok: false as const, err }),
+    );
+    await flushMicrotasks();
+    const handle = instances[instances.length - 1];
+
+    // Sync + write happen; persistence subscription is registered (unsynced=1).
+    handle.fireSynced();
+    await flushMicrotasks();
+
+    // Connection drops: this sets connectionLost=true and finishes with an error.
+    handle.fireDisconnect();
+    await flushMicrotasks();
+
+    // A late reconnect handshake drives the counter back to 0. Because the
+    // connection was already lost, the unsyncedChanges handler must NOT report
+    // success — and finish() is idempotent (settled flag), so this is a no-op.
+    handle.emitUnsynced(0);
+    await flushMicrotasks();
+
+    const outcome = await settled;
+    expect(outcome.ok).toBe(false);
+    if (!outcome.ok) {
+      expect(outcome.err.message).toMatch(
+        /connection closed before the update was persisted/i,
+      );
+    }
+  });
+
+  it('onClose before persistence rejects with the connection-closed error', async () => {
+    const pageId = uniquePageId();
+    const promise = mutatePageContent(
+      pageId,
+      'tok',
+      'http://x/api',
+      () => newDocWith('x'),
+    );
+    const settled = promise.then(
+      () => ({ ok: true as const }),
+      (err: Error) => ({ ok: false as const, err }),
+    );
+    await flushMicrotasks();
+    const handle = instances[instances.length - 1];
+    handle.fireSynced();
+    await flushMicrotasks();
+    handle.fireClose();
+    await flushMicrotasks();
+    const outcome = await settled;
+    expect(outcome.ok).toBe(false);
+    if (!outcome.ok) {
+      expect(outcome.err.message).toMatch(
+        /connection closed before the update was persisted/i,
+      );
+    }
+  });
+
+  it('authentication failure rejects with the auth error', async () => {
+    const pageId = uniquePageId();
+    const promise = mutatePageContent(
+      pageId,
+      'tok',
+      'http://x/api',
+      () => newDocWith('x'),
+    );
+    const settled = promise.then(
+      () => ({ ok: true as const }),
+      (err: Error) => ({ ok: false as const, err }),
+    );
+    await flushMicrotasks();
+    const handle = instances[instances.length - 1];
+    handle.fireAuthFailed();
+    await flushMicrotasks();
+    const outcome = await settled;
+    expect(outcome.ok).toBe(false);
+    if (!outcome.ok) {
+      expect(outcome.err.message).toMatch(/Authentication failed/i);
+    }
+  });
+});
+
+describe('mutatePageContent — timeouts (fake timers)', () => {
+  it('connect timeout rejects when onSynced never fires', async () => {
+    const pageId = uniquePageId();
+    const promise = mutatePageContent(
+      pageId,
+      'tok',
+      'http://x/api',
+      () => newDocWith('never'),
+    );
+    const settled = promise.then(
+      () => ({ ok: true as const }),
+      (err: Error) => ({ ok: false as const, err }),
+    );
+    await flushMicrotasks();
+    // Never fire onSynced. Advance past CONNECT_TIMEOUT_MS (25000).
+    await vi.advanceTimersByTimeAsync(25001);
+    await flushMicrotasks();
+    const outcome = await settled;
+    expect(outcome.ok).toBe(false);
+    if (!outcome.ok) {
+      expect(outcome.err.message).toMatch(/Connection timeout/i);
+    }
+  });
+
+  it('persist timeout rejects when unsyncedChanges never reaches 0 after the write', async () => {
+    const pageId = uniquePageId();
+    const promise = mutatePageContent(
+      pageId,
+      'tok',
+      'http://x/api',
+      () => newDocWith('stuck'),
+    );
+    const settled = promise.then(
+      () => ({ ok: true as const }),
+      (err: Error) => ({ ok: false as const, err }),
+    );
+    await flushMicrotasks();
+    const handle = instances[instances.length - 1];
+    // Write happens, but the counter stays at 1 (default) — never acknowledged.
+    handle.fireSynced();
+    await flushMicrotasks();
+    // Advance past PERSIST_TIMEOUT_MS (20000). The connect timer was cleared
+    // when onSynced ran, so only the persist timer is pending.
+    await vi.advanceTimersByTimeAsync(20001);
+    await flushMicrotasks();
+    const outcome = await settled;
+    expect(outcome.ok).toBe(false);
+    if (!outcome.ok) {
+      expect(outcome.err.message).toMatch(/persist the update/i);
+    }
+  });
+});
--- a/test/collaboration-pure.test.ts
+++ b/test/collaboration-pure.test.ts
@@ -0,0 +1,415 @@
+import { describe, expect, it } from 'vitest';
+// Importing this module mutates the global DOM (jsdom is installed onto
+// global.window/document/Element at load time) and pulls in yjs/hocuspocus/
+// ws/marked. That is expected and works in the vitest "node" environment.
+import {
+  buildCollabWsUrl,
+  buildYDoc,
+  assertYjsEncodable,
+  markdownToProseMirror,
+} from '../packages/docmost-client/src/lib/collaboration.js';
+// Y is imported only to assert the runtime type of buildYDoc's return value.
+import * as Y from 'yjs';
+
+// ---------------------------------------------------------------------------
+// Small helpers / fixtures.
+// ---------------------------------------------------------------------------
+
+// A minimal, valid Docmost ProseMirror doc that Yjs can encode without issue.
+// `null` attribute values are legitimate (only `undefined` is unstorable), so
+// this round-trips cleanly through sanitizeForYjs + toYdoc.
+const validDoc = () => ({
+  type: 'doc',
+  content: [
+    {
+      type: 'paragraph',
+      attrs: { id: null, indent: null, textAlign: null },
+      content: [{ type: 'text', text: 'hello' }],
+    },
+  ],
+});
+
+// ===========================================================================
+describe('buildCollabWsUrl', () => {
+  // -------------------------------------------------------------------------
+  describe('scheme rewrite', () => {
+    it('rewrites http:// to ws://', () => {
+      expect(buildCollabWsUrl('http://localhost:3000')).toBe(
+        'ws://localhost:3000/collab',
+      );
+    });
+
+    it('rewrites https:// to wss://', () => {
+      expect(buildCollabWsUrl('https://docmost.example.com')).toBe(
+        'wss://docmost.example.com/collab',
+      );
+    });
+
+    it('only the LEADING http is rewritten (^http anchor)', () => {
+      // The regex is anchored at the start, so "http" appearing later in the
+      // host/path is untouched — only the scheme flips to ws.
+      expect(buildCollabWsUrl('https://httpbin.example.com')).toBe(
+        'wss://httpbin.example.com/collab',
+      );
+    });
+  });
+
+  // -------------------------------------------------------------------------
+  describe('trailing /api stripping', () => {
+    it('strips a trailing /api (no slash) before mounting /collab', () => {
+      expect(buildCollabWsUrl('http://localhost:3000/api')).toBe(
+        'ws://localhost:3000/collab',
+      );
+    });
+
+    it('strips a trailing /api/ (with slash)', () => {
+      expect(buildCollabWsUrl('https://docmost.example.com/api/')).toBe(
+        'wss://docmost.example.com/collab',
+      );
+    });
+
+    it('strips /api even when it follows a base path, keeping the base', () => {
+      expect(buildCollabWsUrl('http://x.com/base/api')).toBe(
+        'ws://x.com/base/collab',
+      );
+      expect(buildCollabWsUrl('http://x.com/base/api/')).toBe(
+        'ws://x.com/base/collab',
+      );
+    });
+  });
+
+  // -------------------------------------------------------------------------
+  describe('/collab mounting', () => {
+    it('mounts /collab exactly once on a bare host', () => {
+      const out = buildCollabWsUrl('http://x.com');
+      expect(out).toBe('ws://x.com/collab');
+      // Exactly one occurrence of "/collab".
+      expect(out.match(/\/collab/g)?.length).toBe(1);
+    });
+
+    it('does not leave a double slash when the base ends in /', () => {
+      // The pathname has its single trailing slash stripped before "/collab"
+      // is appended, so there is no "//collab".
+      expect(buildCollabWsUrl('http://x.com/')).toBe('ws://x.com/collab');
+    });
+  });
+
+  // -------------------------------------------------------------------------
+  describe('query/hash dropping', () => {
+    it('drops any query string and hash from the base URL', () => {
+      expect(buildCollabWsUrl('https://x.com/api/?a=1&b=2#frag')).toBe(
+        'wss://x.com/collab',
+      );
+    });
+
+    it('drops a bare query on a host with no path', () => {
+      expect(buildCollabWsUrl('http://x.com?token=abc')).toBe(
+        'ws://x.com/collab',
+      );
+    });
+  });
+
+  // -------------------------------------------------------------------------
+  describe('"already /collab" handling (valid-URL path is NOT idempotent)', () => {
+    // The task spec claims an already-"/collab" input is idempotent. That is
+    // only true on the malformed-URL FALLBACK branch (which guards with
+    // `if (!wsUrl.endsWith("/collab"))`). On the normal valid-URL parsing path
+    // there is NO such guard: the pathname always gets "/collab" appended, so a
+    // URL that already ends in /collab gets a SECOND /collab. We assert the
+    // ACTUAL behaviour rather than the (incorrect) idempotency claim.
+    it('appends a second /collab to a valid URL already ending in /collab', () => {
+      expect(buildCollabWsUrl('https://x.com/collab')).toBe(
+        'wss://x.com/collab/collab',
+      );
+    });
+  });
+
+  // -------------------------------------------------------------------------
+  describe('malformed-URL fallback branch', () => {
+    // `new URL("not-a-valid-url")` throws (no scheme), so the catch branch
+    // runs: it appends "/collab" only when the string does not already end in
+    // "/collab", after stripping one trailing slash.
+    it('appends /collab to a string that cannot be parsed as a URL', () => {
+      expect(buildCollabWsUrl('not-a-valid-url')).toBe('not-a-valid-url/collab');
+    });
+
+    it('strips a single trailing slash before appending /collab (fallback)', () => {
+      expect(buildCollabWsUrl('not-a-valid-url/')).toBe(
+        'not-a-valid-url/collab',
+      );
+    });
+
+    it('is idempotent in the fallback branch when already ending in /collab', () => {
+      // This is the ONLY branch where "/collab" is idempotent: the fallback
+      // guard `!wsUrl.endsWith("/collab")` skips the append.
+      expect(buildCollabWsUrl('not-a-valid-url/collab')).toBe(
+        'not-a-valid-url/collab',
+      );
+    });
+  });
+});
+
+// ===========================================================================
+describe('buildYDoc', () => {
+  it('round-trips a valid PM doc into a Y.Doc (encodes without throwing)', () => {
+    const ydoc = buildYDoc(validDoc());
+    expect(ydoc).toBeInstanceOf(Y.Doc);
+    // It also encodes to a non-empty Yjs update, proving content was stored.
+    expect(Y.encodeStateAsUpdate(ydoc).length).toBeGreaterThan(0);
+  });
+
+  it('sanitizes an undefined attribute value and still encodes', () => {
+    // `undefined` is the common cause of the opaque yjs failure; sanitizeForYjs
+    // strips it, so the doc encodes cleanly into a Y.Doc.
+    const doc = {
+      type: 'doc',
+      content: [
+        {
+          type: 'paragraph',
+          attrs: { id: undefined, indent: null, textAlign: null },
+          content: [{ type: 'text', text: 'hi' }],
+        },
+      ],
+    };
+    const ydoc = buildYDoc(doc);
+    expect(ydoc).toBeInstanceOf(Y.Doc);
+  });
+
+  it('throws a descriptive error that names the offending attribute path', () => {
+    // To exercise the `findUnstorableAttr` branch we need a doc that (a)
+    // survives structuredClone in sanitizeForYjs, (b) makes toYdoc throw, and
+    // (c) carries an attribute value findUnstorableAttr flags. An UNKNOWN node
+    // type (toYdoc throws "Unknown node type") plus a `bigint` attr (survives
+    // structuredClone, flagged by findUnstorableAttr) satisfies all three.
+    const doc = {
+      type: 'doc',
+      content: [
+        {
+          type: 'bogusNode',
+          attrs: { id: 'x', big: 7n },
+          content: [],
+        },
+      ],
+    };
+    let err: Error | undefined;
+    try {
+      buildYDoc(doc);
+    } catch (e) {
+      err = e as Error;
+    }
+    expect(err).toBeInstanceOf(Error);
+    // Descriptive wrapper, original cause, and the named offending path.
+    expect(err!.message).toContain('Failed to encode document to Yjs (toYdoc):');
+    expect(err!.message).toContain('Offending attribute:');
+    expect(err!.message).toContain('content[0].attrs.big (bigint)');
+  });
+
+  it('falls back to the generic hint when toYdoc throws but no attr is flagged', () => {
+    // An invalid doc whose attrs are all storable: the descriptive wrapper
+    // fires, but with the generic "...likely holds a value Yjs cannot store"
+    // suffix instead of a named "Offending attribute:".
+    const doc = { type: 'doc', content: [{ type: 'unknownThing', attrs: { id: 'a' } }] };
+    let err: Error | undefined;
+    try {
+      buildYDoc(doc);
+    } catch (e) {
+      err = e as Error;
+    }
+    expect(err).toBeInstanceOf(Error);
+    expect(err!.message).toContain('Failed to encode document to Yjs (toYdoc):');
+    expect(err!.message).not.toContain('Offending attribute:');
+    expect(err!.message).toContain('value Yjs cannot store');
+  });
+
+  it('a function-valued attribute throws (raw structuredClone error, NOT the descriptive one)', () => {
+    // NOTE on the spec: it suggested "a function or bigint value throws a
+    // descriptive error that names the offending attribute path". In reality a
+    // FUNCTION attribute makes `sanitizeForYjs` -> structuredClone throw
+    // BEFORE buildYDoc's try/catch is reached, so the thrown error is the raw
+    // "... could not be cloned." message and does NOT name the path. We assert
+    // that actual behaviour here.
+    const doc = {
+      type: 'doc',
+      content: [
+        {
+          type: 'paragraph',
+          attrs: { id: 'p1', indent: null, textAlign: null, weird: () => {} },
+          content: [{ type: 'text', text: 'hi' }],
+        },
+      ],
+    };
+    let err: Error | undefined;
+    try {
+      buildYDoc(doc);
+    } catch (e) {
+      err = e as Error;
+    }
+    expect(err).toBeInstanceOf(Error);
+    expect(err!.message).toContain('could not be cloned');
+    // It is the structuredClone error, not the wrapped descriptive one.
+    expect(err!.message).not.toContain('Failed to encode document to Yjs');
+  });
+
+  it('a lone bigint attribute on a VALID doc is storable and does NOT throw', () => {
+    // Another spec correction: a bigint that is NOT accompanied by an otherwise
+    // invalid doc survives structuredClone and toYdoc stores it fine, so no
+    // error is raised. (findUnstorableAttr only ever runs after toYdoc throws.)
+    const doc = {
+      type: 'doc',
+      content: [
+        {
+          type: 'paragraph',
+          attrs: { id: null, indent: null, textAlign: null, big: 5n },
+          content: [{ type: 'text', text: 'hi' }],
+        },
+      ],
+    };
+    expect(() => buildYDoc(doc)).not.toThrow();
+  });
+});
+
+// ===========================================================================
+describe('assertYjsEncodable', () => {
+  it('returns void (no throw) for a valid doc', () => {
+    expect(() => assertYjsEncodable(validDoc())).not.toThrow();
+    expect(assertYjsEncodable(validDoc())).toBeUndefined();
+  });
+
+  it('throws IDENTICALLY to buildYDoc for an invalid doc', () => {
+    // assertYjsEncodable just calls buildYDoc and discards the Y.Doc, so the
+    // error message must be byte-for-byte the same descriptive error.
+    const doc = {
+      type: 'doc',
+      content: [{ type: 'bogusNode', attrs: { id: 'x', big: 7n }, content: [] }],
+    };
+
+    const grab = (fn: () => void): string => {
+      try {
+        fn();
+      } catch (e) {
+        return (e as Error).message;
+      }
+      throw new Error('expected the call to throw, but it did not');
+    };
+
+    const fromAssert = grab(() => assertYjsEncodable(doc));
+    const fromBuild = grab(() => buildYDoc(doc));
+    expect(fromAssert).toBe(fromBuild);
+    expect(fromAssert).toContain('Offending attribute: content[0].attrs.big (bigint)');
+  });
+});
+
+// ===========================================================================
+describe('markdownToProseMirror', () => {
+  it('returns a single empty paragraph doc for an empty string', async () => {
+    const out = await markdownToProseMirror('');
+    expect(out.type).toBe('doc');
+    expect(Array.isArray(out.content)).toBe(true);
+    expect(out.content).toHaveLength(1);
+    expect(out.content[0].type).toBe('paragraph');
+    // An empty paragraph has no `content` array (no inline children).
+    expect(out.content[0].content).toBeUndefined();
+  });
+
+  // -------------------------------------------------------------------------
+  describe('callouts (via preprocessCallouts)', () => {
+    it('converts a :::info ... ::: fence into a callout node', async () => {
+      const out = await markdownToProseMirror(':::info\nHello **world**\n:::');
+      expect(out.type).toBe('doc');
+      expect(out.content).toHaveLength(1);
+      const callout = out.content[0];
+      expect(callout.type).toBe('callout');
+      expect(callout.attrs.type).toBe('info');
+      // Inner markdown is rendered: a paragraph containing the bold run.
+      expect(callout.content[0].type).toBe('paragraph');
+      const inline = callout.content[0].content;
+      const boldNode = inline.find((n: any) =>
+        Array.isArray(n.marks) && n.marks.some((m: any) => m.type === 'bold'),
+      );
+      expect(boldNode).toBeDefined();
+      expect(boldNode.text).toBe('world');
+    });
+
+    it('lower-cases the callout type from the fence', async () => {
+      // CALLOUT_OPEN_RE captures the type and preprocessCallouts lower-cases it.
+      const out = await markdownToProseMirror(':::WARNING\nbeware\n:::');
+      expect(out.content[0].type).toBe('callout');
+      expect(out.content[0].attrs.type).toBe('warning');
+    });
+
+    it('handles a nested callout via the depth counter', async () => {
+      // An inner :::type opens a deeper level; the outer fence matches the
+      // OUTERMOST closing :::, so the inner callout nests inside the outer one.
+      const md = ':::info\nouter\n:::success\ninner\n:::\n:::';
+      const out = await markdownToProseMirror(md);
+      expect(out.content).toHaveLength(1);
+      const outer = out.content[0];
+      expect(outer.type).toBe('callout');
+      expect(outer.attrs.type).toBe('info');
+      // Somewhere inside the outer callout there is a nested success callout.
+      const nested = outer.content.find((n: any) => n.type === 'callout');
+      expect(nested).toBeDefined();
+      expect(nested.attrs.type).toBe('success');
+    });
+
+    it('does NOT treat a ::: line inside a fenced code block as a callout', async () => {
+      // The single-pass scanner tracks code fences and copies their `:::` lines
+      // through verbatim, so the result is a codeBlock, not a callout.
+      const md = '```\n:::info\nnot a callout\n:::\n```';
+      const out = await markdownToProseMirror(md);
+      expect(out.content).toHaveLength(1);
+      expect(out.content[0].type).toBe('codeBlock');
+      // No callout node anywhere in the output.
+      expect(out.content.some((n: any) => n.type === 'callout')).toBe(false);
+      // The literal ::: text survives inside the code block's text.
+      const codeText = out.content[0].content[0].text;
+      expect(codeText).toContain(':::info');
+      expect(codeText).toContain(':::');
+    });
+  });
+
+  // -------------------------------------------------------------------------
+  describe('task lists (via bridgeTaskLists)', () => {
+    it('converts a GFM checkbox UL into a taskList with checked state', async () => {
+      const out = await markdownToProseMirror('- [x] done\n- [ ] todo');
+      expect(out.content).toHaveLength(1);
+      const list = out.content[0];
+      expect(list.type).toBe('taskList');
+      expect(list.content).toHaveLength(2);
+      expect(list.content[0].type).toBe('taskItem');
+      expect(list.content[0].attrs.checked).toBe(true);
+      expect(list.content[1].type).toBe('taskItem');
+      expect(list.content[1].attrs.checked).toBe(false);
+      // No stray bulletList/orderedList survives beside the taskList.
+      expect(out.content.some((n: any) => n.type === 'bulletList')).toBe(false);
+    });
+
+    it('converts an ORDERED list whose every item is a checkbox into a taskList', async () => {
+      // bridgeTaskLists rule: BOTH <ul> and <ol> are candidates, and an <ol>
+      // whose every direct <li> carries its own checkbox is rewritten to a
+      // taskList (the <ol> is renamed to <ul> so no phantom orderedList remains).
+      const out = await markdownToProseMirror('1. [x] a\n2. [ ] b');
+      expect(out.content).toHaveLength(1);
+      const list = out.content[0];
+      expect(list.type).toBe('taskList');
+      expect(list.content[0].attrs.checked).toBe(true);
+      expect(list.content[1].attrs.checked).toBe(false);
+      // Crucially, NO phantom empty orderedList is emitted beside the taskList.
+      expect(out.content.some((n: any) => n.type === 'orderedList')).toBe(false);
+    });
+
+    it('leaves an ordinary ordered list (no checkboxes) as an orderedList', async () => {
+      // Mixed/ordinary lists are untouched — they keep rendering as numbered.
+      const out = await markdownToProseMirror('1. a\n2. b');
+      expect(out.content).toHaveLength(1);
+      expect(out.content[0].type).toBe('orderedList');
+      expect(out.content.some((n: any) => n.type === 'taskList')).toBe(false);
+    });
+
+    it('leaves an ordinary bullet list untouched', async () => {
+      const out = await markdownToProseMirror('- a\n- b');
+      expect(out.content[0].type).toBe('bulletList');
+      expect(out.content.some((n: any) => n.type === 'taskList')).toBe(false);
+    });
+  });
+});
--- a/test/config-errors-invalid.test.ts
+++ b/test/config-errors-invalid.test.ts
@@ -0,0 +1,139 @@
+import { afterEach, describe, expect, it, vi } from 'vitest';
+import { z, ZodError } from 'zod';
+import { loadSettingsOrExit } from '../src/config-errors.js';
+import { envSchema } from '../src/settings.js';
+
+// Companion to test/config-errors.test.ts. That file covers the success path,
+// the MISSING-required (undefined -> invalid_type) -> exit branch, and the
+// non-ZodError passthrough. This file fills the remaining GAP: the
+// INVALID-VALUE branch (config-errors.ts lines ~20, 27-30). A ZodError whose
+// issue is a CONSTRAINT violation (bad URL, bad enum, too-short string) is NOT
+// a missing key, so it must be routed into the `invalid` bucket and reported
+// under the "Invalid value(s)" heading with a `<name>: <message>` line — a
+// distinct, operator-facing message from the missing-variable case.
+describe('loadSettingsOrExit — invalid-value branch', () => {
+  afterEach(() => {
+    vi.restoreAllMocks();
+  });
+
+  // Stub process.exit so it throws (control stops at the exit point without
+  // killing the runner) and capture everything written to stderr. Mirrors the
+  // approach in the existing config-errors.test.ts.
+  function stubExitAndStderr() {
+    const exitSpy = vi.spyOn(process, 'exit').mockImplementation(((
+      code?: number,
+    ) => {
+      throw new Error(`exit:${code}`);
+    }) as never);
+    const writeSpy = vi
+      .spyOn(process.stderr, 'write')
+      .mockImplementation(() => true);
+    const written = () => writeSpy.mock.calls.map((c) => String(c[0])).join('');
+    return { exitSpy, writeSpy, written };
+  }
+
+  it('exits(1) and reports an invalid value (bad URL) under "Invalid value(s)"', () => {
+    const { exitSpy, written } = stubExitAndStderr();
+
+    // A present-but-invalid DOCMOST_API_URL: the value exists (so it is NOT a
+    // missing-key issue), but fails the .url() constraint -> goes to `invalid`.
+    expect(() =>
+      loadSettingsOrExit(() =>
+        envSchema.parse({
+          DOCMOST_API_URL: 'not-a-url',
+          DOCMOST_EMAIL: 'ops@example.com',
+          DOCMOST_PASSWORD: 'hunter2',
+          DOCMOST_SPACE_ID: 'space-1',
+        }),
+      ),
+    ).toThrow('exit:1');
+
+    expect(exitSpy).toHaveBeenCalledWith(1);
+    const out = written();
+    // The invalid-value heading must appear...
+    expect(out).toContain('Invalid value(s)');
+    // ...and it must name the offending variable on a `<name>: <message>` line.
+    expect(out).toContain('DOCMOST_API_URL:');
+    // The header line is always present.
+    expect(out).toContain('Configuration error in environment / .env:');
+    // It must NOT misreport an invalid value as a missing one.
+    expect(out).not.toContain('Missing required variable(s)');
+  });
+
+  it('exits(1) and reports an invalid enum value (LOG_LEVEL)', () => {
+    const { exitSpy, written } = stubExitAndStderr();
+
+    // All required vars present and valid; only LOG_LEVEL violates the enum.
+    expect(() =>
+      loadSettingsOrExit(() =>
+        envSchema.parse({
+          DOCMOST_API_URL: 'https://docs.example.com/api',
+          DOCMOST_EMAIL: 'ops@example.com',
+          DOCMOST_PASSWORD: 'hunter2',
+          DOCMOST_SPACE_ID: 'space-1',
+          LOG_LEVEL: 'verbose', // not in ['debug','info','warn','error']
+        }),
+      ),
+    ).toThrow('exit:1');
+
+    expect(exitSpy).toHaveBeenCalledWith(1);
+    const out = written();
+    expect(out).toContain('Invalid value(s)');
+    expect(out).toContain('LOG_LEVEL:');
+    expect(out).not.toContain('Missing required variable(s)');
+  });
+
+  it('routes a hand-built constraint-violation ZodError into the invalid bucket', () => {
+    const { exitSpy, written } = stubExitAndStderr();
+
+    // Construct the ZodError directly from a min-length violation so the test
+    // does not depend on the project schema's exact field set. The issue has a
+    // non-empty path (so a variable name is printed) and code "too_small"
+    // (NOT invalid_type/undefined), so config-errors.ts classifies it as
+    // invalid rather than missing.
+    const zerr = new ZodError([
+      {
+        code: 'too_small',
+        minimum: 1,
+        type: 'string',
+        inclusive: true,
+        path: ['DOCMOST_PASSWORD'],
+        message: 'String must contain at least 1 character(s)',
+      } as z.ZodIssue,
+    ]);
+
+    expect(() =>
+      loadSettingsOrExit(() => {
+        throw zerr;
+      }),
+    ).toThrow('exit:1');
+
+    expect(exitSpy).toHaveBeenCalledWith(1);
+    const out = written();
+    expect(out).toContain('Invalid value(s)');
+    expect(out).toContain('DOCMOST_PASSWORD: String must contain at least 1');
+    expect(out).not.toContain('Missing required variable(s)');
+  });
+
+  it('reports missing AND invalid in their own sections when both occur', () => {
+    const { exitSpy, written } = stubExitAndStderr();
+
+    // DOCMOST_API_URL present but invalid (-> invalid section); the three other
+    // required vars absent (-> missing section). Confirms the two branches are
+    // populated and emitted independently.
+    expect(() =>
+      loadSettingsOrExit(() =>
+        envSchema.parse({
+          DOCMOST_API_URL: 'not-a-url',
+        }),
+      ),
+    ).toThrow('exit:1');
+
+    expect(exitSpy).toHaveBeenCalledWith(1);
+    const out = written();
+    expect(out).toContain('Missing required variable(s)');
+    expect(out).toContain('Invalid value(s)');
+    expect(out).toContain('DOCMOST_API_URL:');
+    expect(out).toContain('DOCMOST_EMAIL');
+  });
+});
--- a/test/diff.test.ts
+++ b/test/diff.test.ts
@@ -0,0 +1,359 @@
+import { describe, expect, it } from 'vitest';
+import { diffDocs } from '../packages/docmost-client/src/lib/diff.js';
+
+// ---------------------------------------------------------------------------
+// ProseMirror JSON builders. diffDocs accepts plain JSON docs (it parses them
+// through the Docmost schema internally), so we only need minimal node shapes.
+// ---------------------------------------------------------------------------
+
+/** A paragraph; omit `text` for an empty paragraph (no content array entries). */
+const para = (text?: string) => ({
+  type: 'paragraph',
+  content: text ? [{ type: 'text', text }] : [],
+});
+
+/** A heading (level 2 by default) carrying a single text run. */
+const heading = (text: string, level = 2) => ({
+  type: 'heading',
+  attrs: { level },
+  content: [{ type: 'text', text }],
+});
+
+/** A top-level doc node wrapping the given blocks. */
+const doc = (...content: any[]) => ({ type: 'doc', content });
+
+/** An image node (atom). */
+const image = () => ({ type: 'image', attrs: {} });
+
+/** A callout node wrapping one paragraph. */
+const callout = (text = 'note') => ({
+  type: 'callout',
+  attrs: { type: 'info' },
+  content: [para(text)],
+});
+
+/** A 1x1 table. */
+const table = (cell = 'c') => ({
+  type: 'table',
+  content: [
+    { type: 'tableRow', content: [{ type: 'tableCell', content: [para(cell)] }] },
+  ],
+});
+
+/** A paragraph carrying a text run that bears a link mark with the given href. */
+const linkPara = (text: string, href: string | undefined, extraMarks: any[] = []) => ({
+  type: 'paragraph',
+  content: [
+    {
+      type: 'text',
+      text,
+      marks: [{ type: 'link', attrs: href === undefined ? {} : { href } }, ...extraMarks],
+    },
+  ],
+});
+
+/** The diff.ts default for the notes-heading argument. */
+const DEFAULT_NOTES_HEADING = 'Примечания переводчика';
+
+describe('diffDocs', () => {
+  describe('textual changes (precise path)', () => {
+    it('reports no changes for two identical docs', () => {
+      const d = doc(para('hello world'));
+      const result = diffDocs(d, d);
+
+      expect(result.changes).toHaveLength(0);
+      expect(result.summary).toEqual({ inserted: 0, deleted: 0, blocksChanged: 0 });
+      // The Changes section renders the sentinel line for an empty change list.
+      expect(result.markdown).toContain('(no textual changes)');
+    });
+
+    it('counts a pure insertion ("abc" -> "abcXY") and captures the inserted substring', () => {
+      const result = diffDocs(doc(para('abc')), doc(para('abcXY')));
+
+      expect(result.summary.inserted).toBe(2);
+      expect(result.summary.deleted).toBe(0);
+      // Exactly one insert change whose text equals the inserted substring.
+      const inserts = result.changes.filter((c) => c.op === 'insert');
+      expect(inserts).toHaveLength(1);
+      expect(inserts[0].text).toBe('XY');
+      // No deletions on a pure insertion.
+      expect(result.changes.filter((c) => c.op === 'delete')).toHaveLength(0);
+    });
+
+    it('counts a pure deletion ("abcXY" -> "abc") and captures the deleted substring', () => {
+      const result = diffDocs(doc(para('abcXY')), doc(para('abc')));
+
+      expect(result.summary.deleted).toBe(2);
+      expect(result.summary.inserted).toBe(0);
+      const deletes = result.changes.filter((c) => c.op === 'delete');
+      expect(deletes).toHaveLength(1);
+      expect(deletes[0].text).toBe('XY');
+      expect(result.changes.filter((c) => c.op === 'insert')).toHaveLength(0);
+    });
+
+    it('reports a word modification as a matched delete + insert with exact substrings', () => {
+      const result = diffDocs(doc(para('hello world')), doc(para('hello there')));
+
+      // "world" (5) removed, "there" (5) added.
+      expect(result.summary.inserted).toBe(5);
+      expect(result.summary.deleted).toBe(5);
+
+      const deletes = result.changes.filter((c) => c.op === 'delete');
+      const inserts = result.changes.filter((c) => c.op === 'insert');
+      expect(deletes.map((c) => c.text)).toContain('world');
+      expect(inserts.map((c) => c.text)).toContain('there');
+    });
+
+    it('handles two empty docs without error', () => {
+      const result = diffDocs({ type: 'doc', content: [] }, { type: 'doc', content: [] });
+
+      expect(result.changes).toHaveLength(0);
+      expect(result.summary).toEqual({ inserted: 0, deleted: 0, blocksChanged: 0 });
+      expect(result.markdown).toContain('(no textual changes)');
+    });
+
+    it('reports an insertion into an empty doc', () => {
+      const result = diffDocs({ type: 'doc', content: [] }, doc(para('brand new')));
+
+      expect(result.summary.inserted).toBeGreaterThan(0);
+      const inserts = result.changes.filter((c) => c.op === 'insert');
+      expect(inserts.length).toBeGreaterThan(0);
+      // The inserted text is the new paragraph's content.
+      expect(inserts.map((c) => c.text).join('')).toContain('brand new');
+    });
+  });
+
+  describe('integrity counting', () => {
+    it('counts images, tables and callouts as old -> new tuples', () => {
+      // old: 1 image, 1 callout, 1 table   new: 2 images, 0 callouts, 1 table
+      const oldDoc = doc(image(), callout(), table());
+      const newDoc = doc(image(), image(), table());
+      const { integrity } = diffDocs(oldDoc, newDoc);
+
+      expect(integrity.images).toEqual([1, 2]);
+      expect(integrity.callouts).toEqual([1, 0]);
+      expect(integrity.tables).toEqual([1, 1]);
+    });
+
+    it('renders the integrity section verbatim in the markdown', () => {
+      const oldDoc = doc(image(), callout(), table());
+      const newDoc = doc(image(), image(), table());
+      const { markdown } = diffDocs(oldDoc, newDoc);
+
+      // The integrity block is our own formatting, so exact lines are asserted.
+      expect(markdown).toContain('## Integrity (old -> new)');
+      expect(markdown).toContain('- images: 1 -> 2');
+      expect(markdown).toContain('- callouts: 1 -> 0');
+      expect(markdown).toContain('- tables: 1 -> 1');
+    });
+
+    it('counts a single link split across two adjacent runs (shared href) as one link', () => {
+      // Two text runs, both bearing a link to the SAME href; one also bold.
+      const d = doc({
+        type: 'paragraph',
+        content: [
+          { type: 'text', text: 'foo', marks: [{ type: 'link', attrs: { href: 'http://x' } }, { type: 'bold' }] },
+          { type: 'text', text: 'bar', marks: [{ type: 'link', attrs: { href: 'http://x' } }] },
+        ],
+      });
+      const { integrity } = diffDocs(d, d);
+
+      // Counting by unique href collapses the two runs into one link.
+      expect(integrity.links).toEqual([1, 1]);
+    });
+
+    it('counts distinct hrefs separately', () => {
+      const d = doc({
+        type: 'paragraph',
+        content: [
+          { type: 'text', text: 'one', marks: [{ type: 'link', attrs: { href: 'http://a' } }] },
+          { type: 'text', text: 'two', marks: [{ type: 'link', attrs: { href: 'http://b' } }] },
+        ],
+      });
+      const { integrity } = diffDocs(d, d);
+      expect(integrity.links).toEqual([2, 2]);
+    });
+
+    it('counts a link mark with a missing href once (bucketed under "")', () => {
+      // Per source: a missing/empty href is collected under a single "" key, so a
+      // malformed link is still counted exactly once.
+      const d = linkPara('orphan', undefined);
+      const { integrity } = diffDocs(d, d);
+      expect(integrity.links).toEqual([1, 1]);
+    });
+  });
+
+  describe('footnoteMarkers', () => {
+    it('excludes markers after the default notes heading and preserves reading order', () => {
+      // Body has [1] then [2]; the [99] sits AFTER the notes heading and must be
+      // excluded from both old and new marker lists.
+      const d = doc(
+        para('intro [1] middle [2]'),
+        heading(DEFAULT_NOTES_HEADING),
+        para('[99] footnote body'),
+      );
+      const { integrity } = diffDocs(d, d);
+
+      expect(integrity.footnoteMarkers).toEqual([
+        [1, 2],
+        [1, 2],
+      ]);
+      // Reading order: [1] precedes [2].
+      expect(integrity.footnoteMarkers[1]).toEqual([1, 2]);
+    });
+
+    it('honors a custom notesHeading argument', () => {
+      const d = doc(para('a [1]'), heading('Notes'), para('[5] excluded'));
+      const { integrity } = diffDocs(d, d, 'Notes');
+
+      // With the matching custom heading, [5] is excluded.
+      expect(integrity.footnoteMarkers).toEqual([[1], [1]]);
+    });
+
+    it('includes every marker when no notes heading is present', () => {
+      // No heading equals the notesHeading -> the whole doc is the body.
+      const d = doc(para('a [1] b [2]'), para('[3]'));
+      const { integrity } = diffDocs(d, d);
+
+      expect(integrity.footnoteMarkers).toEqual([
+        [1, 2, 3],
+        [1, 2, 3],
+      ]);
+    });
+
+    it('renders the footnoteMarkers integrity line verbatim', () => {
+      const d = doc(para('x [1] y [2]'), heading(DEFAULT_NOTES_HEADING), para('[9]'));
+      const { markdown } = diffDocs(d, d);
+      expect(markdown).toContain('- footnoteMarkers: [1, 2] -> [1, 2]');
+    });
+  });
+
+  describe('coarse fallback', () => {
+    // An unknown node type makes Node.fromJSON reject the doc, which throws
+    // inside the precise pipeline and triggers the coarse block-level fallback.
+    // (Confirmed by running the module: `{ type: '___nope' }` is not in the
+    // schema, so parsing throws and `fellBack` becomes true.)
+    it('degrades to a coarse block-level diff instead of throwing', () => {
+      const oldDoc = doc(para('keep this'), { type: '___nope' });
+      const newDoc = doc(para('keep this'), para('new block'));
+
+      // Must not throw.
+      const result = diffDocs(oldDoc, newDoc);
+
+      // The fallback note appears in the markdown header area.
+      expect(result.markdown).toContain('precise diff failed; coarse block-level diff shown.');
+      // Only the genuinely new block is reported; the unchanged "keep this"
+      // block is not.
+      const inserts = result.changes.filter((c) => c.op === 'insert');
+      expect(inserts).toHaveLength(1);
+      expect(inserts[0].text).toBe('new block');
+    });
+
+    it('does not report whitespace-only blocks in the fallback path', () => {
+      // New doc adds a block whose plain text is only whitespace; coarseDiff
+      // skips blocks whose trimmed text is empty.
+      const oldDoc = doc({ type: '___nope' }, para('kept'));
+      const newDoc = doc(para('kept'), para('   '));
+
+      const result = diffDocs(oldDoc, newDoc);
+
+      // Fallback was taken (precise path threw on the unknown node).
+      expect(result.markdown).toContain('coarse block-level diff shown.');
+      // No change is reported: "kept" is unchanged and "   " is whitespace-only.
+      expect(result.changes).toHaveLength(0);
+      expect(result.summary).toEqual({ inserted: 0, deleted: 0, blocksChanged: 0 });
+    });
+
+    it('reports both a deletion and an insertion in the fallback path', () => {
+      const oldDoc = doc(para('old paragraph'), { type: '___nope' });
+      const newDoc = doc(para('new paragraph'));
+
+      const result = diffDocs(oldDoc, newDoc);
+
+      expect(result.markdown).toContain('coarse block-level diff shown.');
+      const deletes = result.changes.filter((c) => c.op === 'delete');
+      const inserts = result.changes.filter((c) => c.op === 'insert');
+      // "old paragraph" no longer present -> deletion; "new paragraph" -> insertion.
+      expect(deletes.map((c) => c.text)).toContain('old paragraph');
+      expect(inserts.map((c) => c.text)).toContain('new paragraph');
+      // Character counts accumulate from the reported texts.
+      expect(result.summary.deleted).toBe('old paragraph'.length);
+      expect(result.summary.inserted).toBe('new paragraph'.length);
+    });
+  });
+
+  describe('blockContextAt (DiffChange.block)', () => {
+    it('truncates a >80-char block context with an ellipsis and keeps it non-empty', () => {
+      // A 100-char paragraph with a one-char edit; the block context guards a
+      // swallowed catch and must produce a truncated, non-empty string.
+      const longText = 'X'.repeat(100);
+      const result = diffDocs(doc(para(longText)), doc(para(longText + 'Z')));
+
+      const inserts = result.changes.filter((c) => c.op === 'insert');
+      expect(inserts).toHaveLength(1);
+      const block = inserts[0].block;
+      expect(block.length).toBeGreaterThan(0);
+      // Truncation rule: 77 chars + "..." = length 80, ending with "...".
+      expect(block.endsWith('...')).toBe(true);
+      expect(block).toHaveLength(80);
+    });
+
+    it('keeps a short block context untruncated', () => {
+      const result = diffDocs(doc(para('abc')), doc(para('abcXY')));
+      const inserts = result.changes.filter((c) => c.op === 'insert');
+      expect(inserts[0].block).toBe('abcXY');
+      expect(inserts[0].block.endsWith('...')).toBe(false);
+    });
+
+    it('dedups blocksChanged by op + block context (multiple edits in one block count once per op)', () => {
+      // Two separate word edits inside a single paragraph produce 4 changes
+      // (2 deletes + 2 inserts) but only 2 distinct block keys:
+      //   "d:the quick brown fox" and "i:the slow brown wolf".
+      const result = diffDocs(
+        doc(para('the quick brown fox')),
+        doc(para('the slow brown wolf')),
+      );
+
+      expect(result.changes.length).toBe(4);
+      expect(result.summary.blocksChanged).toBe(2);
+    });
+
+    it('counts one block key per op for edits spread across two blocks', () => {
+      // Edits in two different paragraphs -> 4 distinct block keys.
+      const result = diffDocs(
+        doc(para('first line here'), para('second line here')),
+        doc(para('first line HERE'), para('second line HERE')),
+      );
+
+      expect(result.summary.blocksChanged).toBe(4);
+    });
+  });
+
+  describe('markdown rendering', () => {
+    it('puts the summary counts in the markdown header', () => {
+      const result = diffDocs(doc(para('abc')), doc(para('abcXY')));
+      expect(result.markdown).toContain(
+        '# Diff: 2 inserted / 0 deleted (1 blocks changed)',
+      );
+    });
+
+    it('renders each change with its op sign (loose membership, library-controlled order)', () => {
+      const result = diffDocs(doc(para('hello world')), doc(para('hello there')));
+
+      // The Changes section is ordered by the diff library; assert membership,
+      // not an exact ordered string. Scope to lines AFTER the "## Changes"
+      // heading, since integrity lines also begin with "- ".
+      const lines = result.markdown.split('\n');
+      const changesIdx = lines.indexOf('## Changes');
+      expect(changesIdx).toBeGreaterThanOrEqual(0);
+      const changeLines = lines
+        .slice(changesIdx + 1)
+        .filter((l) => l.startsWith('+ ') || l.startsWith('- '));
+      expect(changeLines.some((l) => l.startsWith('- ') && l.includes('world'))).toBe(true);
+      expect(changeLines.some((l) => l.startsWith('+ ') && l.includes('there'))).toBe(true);
+      // One delete line and one insert line.
+      expect(changeLines.filter((l) => l.startsWith('- '))).toHaveLength(1);
+      expect(changeLines.filter((l) => l.startsWith('+ '))).toHaveLength(1);
+    });
+  });
+});
--- a/test/docmost-schema.test.ts
+++ b/test/docmost-schema.test.ts
@@ -0,0 +1,184 @@
+import { describe, expect, it } from 'vitest';
+import {
+  sanitizeCssColor,
+  clampCalloutType,
+} from '../packages/docmost-client/src/lib/docmost-schema.js';
+
+/**
+ * Unit tests for the two pure guard functions of the Docmost schema.
+ *
+ * `sanitizeCssColor` is a SECURITY boundary: its return value is interpolated
+ * straight into an inline `style="..."` attribute by Docmost, so any value it
+ * accepts must be incapable of breaking out of that attribute. These tests pin
+ * both the accept set (well-formed CSS <color> syntax) and, more importantly,
+ * the reject set (anything containing the characters an attacker would need to
+ * inject: quotes, angle brackets, semicolons, colons, parentheses with letters,
+ * or a `url(...)` / `expression(...)` payload).
+ */
+
+describe('sanitizeCssColor', () => {
+  describe('accepts well-formed CSS colors', () => {
+    it('accepts simple named colors (letters only), returned verbatim', () => {
+      expect(sanitizeCssColor('red')).toBe('red');
+      expect(sanitizeCssColor('rebeccapurple')).toBe('rebeccapurple');
+      // Case is preserved (the regex is case-insensitive for letters).
+      expect(sanitizeCssColor('Black')).toBe('Black');
+      expect(sanitizeCssColor('transparent')).toBe('transparent');
+    });
+
+    it('accepts #rgb and #rgba short hex', () => {
+      expect(sanitizeCssColor('#abc')).toBe('#abc');
+      expect(sanitizeCssColor('#abcd')).toBe('#abcd');
+      expect(sanitizeCssColor('#FFF')).toBe('#FFF');
+    });
+
+    it('accepts #rrggbb and #rrggbbaa long hex', () => {
+      expect(sanitizeCssColor('#aabbcc')).toBe('#aabbcc');
+      expect(sanitizeCssColor('#AABBCCDD')).toBe('#AABBCCDD');
+      expect(sanitizeCssColor('#0f0f0f')).toBe('#0f0f0f');
+    });
+
+    it('accepts rgb()/rgba() functional notation', () => {
+      expect(sanitizeCssColor('rgb(255, 0, 0)')).toBe('rgb(255, 0, 0)');
+      expect(sanitizeCssColor('rgba(0, 128, 255, 0.5)')).toBe(
+        'rgba(0, 128, 255, 0.5)',
+      );
+      // CSS Color 4 space-separated + slash-alpha syntax (digits, %, /, spaces).
+      expect(sanitizeCssColor('rgb(100% 0% 0% / 50%)')).toBe(
+        'rgb(100% 0% 0% / 50%)',
+      );
+    });
+
+    it('accepts hsl()/hsla() functional notation', () => {
+      expect(sanitizeCssColor('hsl(120, 50%, 50%)')).toBe('hsl(120, 50%, 50%)');
+      expect(sanitizeCssColor('hsla(240, 100%, 50%, 0.3)')).toBe(
+        'hsla(240, 100%, 50%, 0.3)',
+      );
+    });
+  });
+
+  describe('trims surrounding whitespace before validating', () => {
+    it('trims leading/trailing whitespace and returns the trimmed value', () => {
+      // The implementation trims first, then matches; the returned value is the
+      // trimmed string, not the original padded input.
+      expect(sanitizeCssColor('  red  ')).toBe('red');
+      expect(sanitizeCssColor('\t#aabbcc\n')).toBe('#aabbcc');
+      expect(sanitizeCssColor('  rgb(1, 2, 3)  ')).toBe('rgb(1, 2, 3)');
+    });
+  });
+
+  describe('rejects CSS-injection / breakout payloads (returns null)', () => {
+    it('rejects a style-attribute breakout via extra declarations', () => {
+      // The classic "set a valid color, then smuggle another declaration".
+      expect(sanitizeCssColor('red; --x: url(x)')).toBeNull();
+      expect(sanitizeCssColor('red; background: url(http://x)')).toBeNull();
+    });
+
+    it('rejects an attribute breakout via quotes and angle brackets', () => {
+      expect(sanitizeCssColor('red"><script>')).toBeNull();
+      expect(sanitizeCssColor("red'><img src=x>")).toBeNull();
+    });
+
+    it('rejects expression(...) payloads', () => {
+      // `expression` is letters-only but the trailing "(...)" is not part of the
+      // named-color alternative and `expression` is not an allowed function, so
+      // the anchored regex rejects the whole string.
+      expect(sanitizeCssColor('expression(alert(1))')).toBeNull();
+    });
+
+    it('rejects url(...) payloads', () => {
+      expect(sanitizeCssColor('url(http://x)')).toBeNull();
+      expect(sanitizeCssColor('rgb(url(x))')).toBeNull();
+    });
+
+    it('rejects any value containing a semicolon', () => {
+      expect(sanitizeCssColor('red;')).toBeNull();
+      expect(sanitizeCssColor('rgb(1,2,3);')).toBeNull();
+    });
+
+    it('rejects any value containing embedded quotes', () => {
+      expect(sanitizeCssColor('"red"')).toBeNull();
+      expect(sanitizeCssColor("'red'")).toBeNull();
+      expect(sanitizeCssColor('rgb(1,2,"3")')).toBeNull();
+    });
+
+    it('rejects any value containing angle brackets', () => {
+      expect(sanitizeCssColor('<red>')).toBeNull();
+      expect(sanitizeCssColor('red>')).toBeNull();
+    });
+
+    it('rejects functional notation carrying letters inside the parens', () => {
+      // The function body allowlist is [0-9.,%/\s] only — no letters survive,
+      // so a smuggled identifier/keyword inside cannot slip through.
+      expect(sanitizeCssColor('rgb(red)')).toBeNull();
+      expect(sanitizeCssColor('rgb(1, var(--x), 3)')).toBeNull();
+    });
+
+    it('rejects a hex value of an unsupported length', () => {
+      // Only 3/4/6/8 hex digits are allowed; 5 and 7 are not.
+      expect(sanitizeCssColor('#aabbc')).toBeNull();
+      expect(sanitizeCssColor('#aabbccd')).toBeNull();
+      expect(sanitizeCssColor('#xyz')).toBeNull();
+    });
+  });
+
+  describe('rejects empty / whitespace-only / non-string input (returns null)', () => {
+    it('returns null for an empty string', () => {
+      expect(sanitizeCssColor('')).toBeNull();
+    });
+
+    it('returns null for a whitespace-only string', () => {
+      expect(sanitizeCssColor('   ')).toBeNull();
+      expect(sanitizeCssColor('\t\n')).toBeNull();
+    });
+
+    it('returns null for null and undefined', () => {
+      expect(sanitizeCssColor(null)).toBeNull();
+      expect(sanitizeCssColor(undefined)).toBeNull();
+    });
+
+    it('returns null for non-string types', () => {
+      // The guard's first line is a `typeof value !== "string"` check.
+      expect(sanitizeCssColor(123 as unknown as string)).toBeNull();
+      expect(sanitizeCssColor({} as unknown as string)).toBeNull();
+      expect(sanitizeCssColor([] as unknown as string)).toBeNull();
+      expect(sanitizeCssColor(true as unknown as string)).toBeNull();
+    });
+  });
+});
+
+/**
+ * `clampCalloutType` maps an arbitrary string to one of the four allowed
+ * Docmost callout types, normalizing case and falling back to "info" for
+ * anything unknown / empty / nullish.
+ */
+describe('clampCalloutType', () => {
+  it('passes each allowed value through unchanged', () => {
+    expect(clampCalloutType('info')).toBe('info');
+    expect(clampCalloutType('warning')).toBe('warning');
+    expect(clampCalloutType('danger')).toBe('danger');
+    expect(clampCalloutType('success')).toBe('success');
+  });
+
+  it('normalizes mixed/upper case to lower case', () => {
+    expect(clampCalloutType('WARNING')).toBe('warning');
+    expect(clampCalloutType('Danger')).toBe('danger');
+    expect(clampCalloutType('SuCcEsS')).toBe('success');
+    expect(clampCalloutType('INFO')).toBe('info');
+  });
+
+  it('falls back to "info" for unknown values', () => {
+    expect(clampCalloutType('note')).toBe('info');
+    expect(clampCalloutType('error')).toBe('info');
+    expect(clampCalloutType('tip')).toBe('info');
+  });
+
+  it('falls back to "info" for empty, whitespace and nullish input', () => {
+    expect(clampCalloutType('')).toBe('info');
+    expect(clampCalloutType(null)).toBe('info');
+    expect(clampCalloutType(undefined)).toBe('info');
+    // Surrounding whitespace is NOT trimmed before the allowlist check, so
+    // " warning " is unknown and falls back to "info".
+    expect(clampCalloutType(' warning ')).toBe('info');
+  });
+});
--- a/test/e2e-docmost.test.ts
+++ b/test/e2e-docmost.test.ts
@@ -0,0 +1,171 @@
+/**
+ * End-to-end journeys against a REAL Docmost instance.
+ *
+ * These tests talk to a live server, so they are SKIPPED by default (no live
+ * Docmost is available in CI). They only EXECUTE when the env flag DOCMOST_E2E
+ * is set; otherwise the whole suite is registered via `describe.skip` and
+ * reported as skipped — it must still import cleanly and never error during a
+ * normal `vitest run`.
+ *
+ * How to run (all on one line):
+ *
+ *   DOCMOST_E2E=1 \
+ *   DOCMOST_API_URL=https://your-docmost/api \
+ *   DOCMOST_EMAIL=you@example.com \
+ *   DOCMOST_PASSWORD=secret \
+ *   DOCMOST_SPACE_ID=<spaceId> \
+ *   npx vitest run test/e2e-docmost.test.ts
+ *
+ * Optional: DOCMOST_E2E_PAGE_ID=<pageId> pins the round-trip journey to a
+ * specific page; otherwise it uses the first page found in the space.
+ */
+import { mkdtemp, readFile, readdir, mkdir, writeFile } from 'node:fs/promises';
+import { tmpdir } from 'node:os';
+import { join } from 'node:path';
+import { afterAll, beforeAll, describe, expect, it } from 'vitest';
+import { DocmostClient } from 'docmost-client';
+import { buildVaultLayout, type PageNode } from '../src/layout.js';
+
+// Gate: the journeys run only when DOCMOST_E2E is truthy. By default `d` is
+// describe.skip, so the suite is registered but not executed.
+const RUN_E2E = !!process.env.DOCMOST_E2E;
+const d = RUN_E2E ? describe : describe.skip;
+
+// Read live-connection config from the environment. Read lazily (not at module
+// top-level assertion time) so the skipped path never throws on missing vars.
+function liveConfig() {
+  const apiUrl = process.env.DOCMOST_API_URL ?? '';
+  const email = process.env.DOCMOST_EMAIL ?? '';
+  const password = process.env.DOCMOST_PASSWORD ?? '';
+  const spaceId = process.env.DOCMOST_SPACE_ID ?? '';
+  return { apiUrl, email, password, spaceId };
+}
+
+// Recursively collect every `.md` file path under `root`, relative to `root`,
+// using forward slashes — mirrors the folder hierarchy the pull writes.
+async function collectMarkdownFiles(
+  root: string,
+  prefix = '',
+): Promise<string[]> {
+  const out: string[] = [];
+  const entries = await readdir(root, { withFileTypes: true });
+  for (const e of entries) {
+    const rel = prefix ? `${prefix}/${e.name}` : e.name;
+    if (e.isDirectory()) {
+      out.push(...(await collectMarkdownFiles(join(root, e.name), rel)));
+    } else if (e.isFile() && e.name.endsWith('.md')) {
+      out.push(rel);
+    }
+  }
+  return out;
+}
+
+d('docmost-sync E2E (live server; DOCMOST_E2E gated)', () => {
+  let client: DocmostClient;
+  let vaultPath: string;
+
+  beforeAll(async () => {
+    const { apiUrl, email, password } = liveConfig();
+    // Fail loudly if the gate is on but the connection vars are missing — a
+    // run that was asked to hit a live server with no address is a config bug,
+    // not a silent pass.
+    expect(apiUrl, 'DOCMOST_API_URL must be set when DOCMOST_E2E is on').not.toBe(
+      '',
+    );
+    expect(email, 'DOCMOST_EMAIL must be set').not.toBe('');
+    expect(password, 'DOCMOST_PASSWORD must be set').not.toBe('');
+
+    client = new DocmostClient(apiUrl, email, password);
+    await client.login();
+
+    // A throwaway temp vault so the journey never touches the real data/ vault.
+    vaultPath = await mkdtemp(join(tmpdir(), 'docmost-e2e-vault-'));
+  });
+
+  afterAll(() => {
+    // The temp vault is under the OS temp dir; leave it for post-mortem
+    // inspection — the OS reclaims it. (No teardown that could mask a failure.)
+  });
+
+  // Journey 1 — "pull a space into the vault".
+  // Given the live space, walk its page tree, write one self-contained .md per
+  // page under the deterministic folder hierarchy from buildVaultLayout, and
+  // assert: (a) exactly one file per laid-out page, and (b) each file lands at
+  // the path its layout entry dictates. This re-implements the I/O loop of
+  // src/pull.ts so the assertions can target the produced tree directly.
+  it('pull a space into the vault', async () => {
+    const { spaceId } = liveConfig();
+    expect(spaceId, 'DOCMOST_SPACE_ID must be set').not.toBe('');
+
+    const pages: PageNode[] = await client.listAllSpacePages(spaceId);
+    expect(pages.length).toBeGreaterThan(0);
+
+    const layout = buildVaultLayout(pages);
+
+    // Write one file per page at its laid-out destination (mirrors pull.ts).
+    let written = 0;
+    for (const page of pages) {
+      if (!page || !page.id) continue;
+      const entry = layout.get(page.id);
+      if (!entry) continue;
+      const dir = join(vaultPath, ...entry.segments);
+      await mkdir(dir, { recursive: true });
+      const md = await client.exportPageBody(page.id);
+      await writeFile(join(dir, `${entry.stem}.md`), md, 'utf8');
+      written++;
+    }
+
+    // (a) One Markdown file per page that got a layout entry.
+    const expectedPaths = new Set<string>();
+    for (const page of pages) {
+      const entry = layout.get(page.id);
+      if (!entry) continue;
+      expectedPaths.add([...entry.segments, `${entry.stem}.md`].join('/'));
+    }
+    const actualPaths = await collectMarkdownFiles(vaultPath);
+    expect(actualPaths.length).toBe(written);
+    expect(new Set(actualPaths)).toEqual(expectedPaths);
+
+    // (b) Correct folder hierarchy: every written file sits exactly where its
+    // layout entry (ancestor folders + stem) places it, and every non-root
+    // page is nested under at least one folder segment.
+    for (const page of pages) {
+      const entry = layout.get(page.id);
+      if (!entry) continue;
+      const rel = [...entry.segments, `${entry.stem}.md`].join('/');
+      expect(actualPaths).toContain(rel);
+      const body = await readFile(join(vaultPath, rel), 'utf8');
+      // exportPageBody emits a self-contained file (meta block + body).
+      expect(body.length).toBeGreaterThan(0);
+    }
+  });
+
+  // Journey 2 — "round-trip a page without a phantom diff".
+  // SPEC §0 / §11 idempotency guarantee: export -> import -> export must yield a
+  // byte-identical body. We export a real page's self-contained body, import it
+  // back into the SAME page, then export again and assert the two exports are
+  // byte-for-byte equal (so a subsequent pull produces no phantom git diff).
+  it('round-trip a page without a phantom diff', async () => {
+    const { spaceId } = liveConfig();
+
+    // Resolve the target page: an explicit override, else the first page found.
+    let pageId = process.env.DOCMOST_E2E_PAGE_ID ?? '';
+    if (!pageId) {
+      const pages: PageNode[] = await client.listAllSpacePages(spaceId);
+      const first = pages.find((p) => p && p.id);
+      expect(first, 'space has at least one page to round-trip').toBeTruthy();
+      pageId = first!.id;
+    }
+
+    // export #1 (self-contained body, SPEC §3).
+    const md1 = await client.exportPageBody(pageId);
+    expect(md1.length).toBeGreaterThan(0);
+
+    // import the exact bytes back into the same page...
+    await client.importPageMarkdown(pageId, md1);
+
+    // ...then export #2. The idempotency invariant is byte-identical bodies.
+    const md2 = await client.exportPageBody(pageId);
+    expect(md2).toBe(md1);
+  });
+});
--- a/test/markdown-roundtrip.property.test.ts
+++ b/test/markdown-roundtrip.property.test.ts
@@ -0,0 +1,674 @@
+import { describe, expect, it } from 'vitest';
+import fc from 'fast-check';
+// Import the converter DIRECTLY from src (NOT the docmost-client barrel) so we
+// match the path used by the other converter unit tests.
+import { convertProseMirrorToMarkdown } from '../packages/docmost-client/src/lib/markdown-converter.js';
+// markdownToProseMirror lives in collaboration.ts; importing it mutates the
+// global DOM via jsdom at module load time — this is expected and required for
+// @tiptap/html's generateJSON to run under Node.
+import { markdownToProseMirror } from '../packages/docmost-client/src/lib/collaboration.js';
+import { stripBlockIds } from '../src/roundtrip.js';
+
+// ---------------------------------------------------------------------------
+// WHY THIS TEST EXISTS (SPEC §11 / "Задача №0")
+//
+// git is the state store, and git diffs byte-for-byte. The sync daemon does
+// `export(markdown) -> import(ProseMirror) -> export(markdown)` on every pull,
+// so if the *second* export differs from the first by even one byte, every
+// pull produces a phantom diff -> endless commits/conflicts. The single
+// property git actually needs is therefore MARKDOWN BYTE-STABILITY:
+//
+//     md2 := export(import(export(doc)))   MUST equal   md1 := export(doc)
+//
+// This file fuzzes that invariant with fast-check over randomly generated,
+// representative Docmost ProseMirror documents.
+//
+// ---------------------------------------------------------------------------
+// THE "SUPPORTED SPACE" PROBLEM
+//
+// A NAIVE generator surfaces two different kinds of `md2 !== md1`:
+//
+//   (a) GENUINE converter limitations — documented below as `it.fails` repros.
+//   (b) Inputs the converter LEGITIMATELY normalizes, i.e. markdown that is
+//       ambiguous or that the schema rewrites to a canonical form. These are
+//       NOT byte-stable by construction and are NOT bugs; the fix is to keep
+//       the generator inside the byte-stable / supported space.
+//
+// The following were all empirically confirmed (by probing the live converter)
+// and are EXCLUDED from / canonicalized by the byte-stable arbitrary. Each is a
+// markdown ambiguity or a schema/ProseMirror normalization, NOT a converter bug.
+//
+//   * Text that re-triggers block/inline markdown syntax on re-parse:
+//       - a leading `>`/`*`/`-`/`#`/`1.` turns a paragraph into a blockquote/
+//         list/heading;
+//       - `a  b` (2+ spaces) collapses to `a b`;
+//       - `<b>` / `</div>` parse as real HTML tags (and run-concatenation can
+//         form `<word>` across a run boundary);
+//       - `&amp;` / `&lt;` decode back to `&` / `<`;
+//       - a lone backtick is a code-span delimiter and re-pairs globally.
+//     -> The text arbitrary emits space-joined tokens that BEGIN and END with an
+//        alphanumeric word, with any single special char confined to the middle
+//        (space-flanked). Every char the task requires (* _ [ ] ( ) | < > &, and
+//        more) is covered this way; the backtick is exercised via code spans.
+//   * A purely numeric image `alt` ("0") or link `title` ("0") is parsed back as
+//     a NUMBER and dropped by the converter's `value || ""` -> alt/title always
+//     carry at least one letter.
+//   * Callout types other than info/success/warning/danger normalize to `info`
+//     (schema only knows those four) -> generator restricts to those four.
+//   * A list item / callout / blockquote with MULTIPLE block children: the
+//     converter joins them with a single "\n", which marked re-parses as ONE
+//     merged paragraph ("- p1\n  p2" -> "- p1 p2"). -> container bodies hold a
+//     SINGLE paragraph, optionally plus ONE nested list for lists.
+//   * `orderedList.start` / `1)` markers normalize to `1.` -> not emitted.
+//   * Two sibling lists sharing a marker family (bullet/task use "-", ordered
+//     uses "1.") MERGE into one list -> no two list blocks are adjacent.
+//   * TWO consecutive hard breaks render a blank line that marked eats as a
+//     paragraph break, and a trailing hard break is trimmed -> consecutive/
+//     trailing hard breaks are collapsed/removed.
+//   * Adjacent text runs with IDENTICAL marks ("**a****b****c**" -> "**abc**").
+//     A real ProseMirror doc never stores split same-mark runs (the editor
+//     coalesces them) -> the generator merges them too (normalizeInline).
+//
+// The GENUINE, real-but-intentional non-roundtrip limitations are kept HONEST as
+// `it.fails` blocks below (so the suite stays green only because they are marked
+// expected-to-fail, never by hiding them):
+//
+//   1. The `code` mark COMBINED with any other mark. The converter emits nested
+//      HTML (`<strong><code>x</code></strong>`), but the schema's `code` mark
+//      declares `excludes: "_"`, so on import every co-occurring mark is dropped
+//      and the run comes back as `code` only -> md2 == "`x`". Acknowledged in
+//      markdown-converter.ts (the long comment above the marks switch);
+//      impossible to round-trip both while `code` excludes them.
+//   2. A BLOCK-level `image` placed BETWEEN other blocks. The Docmost image node
+//      is block-level but `![](url)` is inline; marked wraps it in a <p>, the
+//      schema hoists the <img> out and leaves an empty paragraph sibling, which
+//      injects an extra blank gap on the second export. An image IS byte-stable
+//      as the sole block (edge artifacts get trimmed) — covered by a green test.
+// ---------------------------------------------------------------------------
+
+// Run a full export -> import -> export cycle and return both markdown strings.
+async function roundTrip(doc: unknown): Promise<{ md1: string; md2: string; doc2: any }> {
+  const md1 = convertProseMirrorToMarkdown(doc);
+  const doc2 = await markdownToProseMirror(md1);
+  const md2 = convertProseMirrorToMarkdown(doc2);
+  return { md1, md2, doc2 };
+}
+
+const SEED = 42;
+const NUM_RUNS = 100;
+
+// ---------------------------------------------------------------------------
+// Inline text arbitraries
+// ---------------------------------------------------------------------------
+
+// Alphanumeric "word" (no markdown-significant characters). Length 1..6.
+const wordArb = fc
+  .stringMatching(/^[A-Za-z0-9]{1,6}$/)
+  .filter((w) => w.length > 0);
+
+// A SINGLE markdown-significant character, emitted only as an isolated,
+// space-flanked token. Every char the task calls out plus a few more; each was
+// verified byte-stable in this position.
+//
+// NOTE: the backtick (`) is DELIBERATELY excluded from free-floating plain
+// text. A lone backtick is a markdown code-span DELIMITER, so its round-trip
+// depends on GLOBAL backtick pairing: a stray backtick in running text adjacent
+// to a real code span ("A ` " + `code`) re-pairs into a different code span and
+// loses a space — genuinely outside the byte-stable space. The backtick is
+// still fully exercised as the `code`-mark delimiter and inside code blocks.
+const specialCharArb = fc.constantFrom(
+  '*', '_', '[', ']', '(', ')', '{', '}', '|', '<', '>', '&', '#', '!', '~', '=', '+', '-',
+);
+
+// Build a "safe special" text string: a space-joined sequence of tokens that
+// always BEGINS and ENDS with an alphanumeric word, with any isolated special
+// chars confined to the MIDDLE (each space-flanked by words).
+//
+// Both boundary guarantees matter:
+//   * Leading word: the line never opens with a block/inline trigger
+//     (">", "*", "-", "#", "1." ...).
+//   * Trailing word: adjacent text runs CONCATENATE with no separator, so a run
+//     ending in a bare "<" beside a run starting with a letter would form a fake
+//     HTML tag ("...0 <" + "A >" -> "0 <A >"), which marked/jsdom strips. Ending
+//     every run with an alphanumeric word keeps every special internal and
+//     space-flanked even after concatenation.
+const safeTextArb: fc.Arbitrary<string> = fc
+  .tuple(
+    wordArb,
+    fc.array(fc.oneof(wordArb, specialCharArb), { minLength: 0, maxLength: 3 }),
+    wordArb,
+  )
+  .map(([first, middle, last]) => [first, ...middle, last].join(' '));
+
+// A plain alphanumeric phrase (1..3 words) for places where even isolated
+// specials are not wanted (e.g. code-block language, mention labels).
+const phraseArb: fc.Arbitrary<string> = fc
+  .array(wordArb, { minLength: 1, maxLength: 3 })
+  .map((ws) => ws.join(' '));
+
+// A phrase guaranteed to contain at least one letter. Used for image alt text:
+// a PURELY numeric alt (e.g. "0", "00") is parsed back by the schema as a
+// NUMBER, and the converter's `alt || ""` then treats the number 0 as falsy and
+// DROPS the alt ("![0](u)" -> "![](u)") — not byte-stable. A letter anywhere in
+// the alt keeps it a string and avoids the coercion.
+const letterPhraseArb: fc.Arbitrary<string> = fc
+  .tuple(
+    fc.stringMatching(/^[A-Za-z]{1,4}$/),
+    fc.array(wordArb, { minLength: 0, maxLength: 2 }),
+  )
+  .map(([head, rest]) => [head, ...rest].join(' '));
+
+
+// A text run with an OPTIONAL single non-code mark (bold/italic/strike), or a
+// SOLE `code` mark, or a link. `code` is never combined with another mark in
+// the byte-stable arbitrary (that combination is the known bug, exercised
+// separately in the it.fails block). Marks wrap safe text, which stays stable
+// even when it contains isolated specials.
+const markedTextRunArb: fc.Arbitrary<any> = fc.oneof(
+  // Plain text.
+  safeTextArb.map((t) => ({ type: 'text', text: t })),
+  // Single formatting mark.
+  fc
+    .tuple(safeTextArb, fc.constantFrom('bold', 'italic', 'strike'))
+    .map(([t, m]) => ({ type: 'text', text: t, marks: [{ type: m }] })),
+  // Sole code mark (backtick span). safeTextArb is already backtick-free, so the
+  // code span content cannot contain an inner backtick (which would be
+  // ambiguous to re-parse).
+  safeTextArb.map((t) => ({ type: 'text', text: t, marks: [{ type: 'code' }] })),
+  // Link with safe text and a paren/space-free href, optionally with a title.
+  // The title rides in a markdown link-title attribute; a purely numeric title
+  // is coerced to a number and dropped on re-import (same class of quirk as the
+  // image alt), so the title always carries at least one letter.
+  fc
+    .tuple(
+      phraseArb,
+      fc.webUrl().filter((u) => !/[()\s]/.test(u)),
+      fc.option(letterPhraseArb, { nil: undefined }),
+    )
+    .map(([t, href, title]) => ({
+      type: 'text',
+      text: t,
+      marks: [{ type: 'link', attrs: title ? { href, title } : { href } }],
+    })),
+);
+
+// Inline math node carrying LaTeX that includes the `a < b` the task asks for.
+const mathInlineArb: fc.Arbitrary<any> = fc
+  .constantFrom('a < b', 'x^2 + y^2', 'a < b < c', '\\frac{1}{2}', 'E = mc^2')
+  .map((text) => ({ type: 'mathInline', attrs: { text } }));
+
+// Mention node (schema attrs); label/id are plain phrases.
+const mentionArb: fc.Arbitrary<any> = fc
+  .tuple(phraseArb, fc.uuid(), fc.uuid())
+  .map(([label, id, entityId]) => ({
+    type: 'mention',
+    attrs: { id, label, entityType: 'user', entityId },
+  }));
+
+const hardBreakArb: fc.Arbitrary<any> = fc.constant({ type: 'hardBreak' });
+
+// Canonicalize a generated inline-content array the way ProseMirror itself
+// stores inline content, then trim the markdown-fragile edges. Applied to both
+// paragraph and heading inline content.
+//
+//   1) MERGE adjacent `text` runs that carry IDENTICAL marks. A real
+//      ProseMirror document never stores two neighbouring runs with the same
+//      mark set — the editor coalesces them into one. A naive generator that
+//      leaves them split produces UNREALISTIC docs AND breaks byte-stability:
+//      three adjacent bold runs export as "**a****b****c**", whose inner
+//      "****" boundaries are ambiguous and re-parse as a single "**abc**".
+//      Merging makes the generated doc canonical and the markdown stable.
+//   2) Collapse CONSECUTIVE hard breaks. Two in a row render as "  \n  \n",
+//      whose middle whitespace-only line marked treats as a paragraph break, so
+//      "a  \n  \nb" re-parses to "a\n\nb". A SINGLE hard break round-trips.
+//   3) Drop a TRAILING hard break: "...  \n" sits at the paragraph edge and is
+//      removed by the converter's .trim().
+const sameMarks = (a: any[] | undefined, b: any[] | undefined): boolean =>
+  JSON.stringify(a ?? []) === JSON.stringify(b ?? []);
+
+function normalizeInline(nodes: any[]): any[] {
+  const out: any[] = [];
+  for (const node of nodes) {
+    const prev = out[out.length - 1];
+    // Collapse a second consecutive hard break.
+    if (node.type === 'hardBreak' && prev && prev.type === 'hardBreak') {
+      continue;
+    }
+    // Merge an adjacent text run with the same marks.
+    if (
+      node.type === 'text' &&
+      prev &&
+      prev.type === 'text' &&
+      sameMarks(prev.marks, node.marks)
+    ) {
+      prev.text += node.text;
+      continue;
+    }
+    // Clone text nodes so the in-place merge above never mutates a shared value.
+    out.push(node.type === 'text' ? { ...node } : node);
+  }
+  while (out.length > 1 && out[out.length - 1].type === 'hardBreak') {
+    out.pop();
+  }
+  return out;
+}
+
+// Inline content for a paragraph: at least one marked text run, optionally with
+// inline atoms (math/mention) and hard breaks interspersed. Always starts with a
+// text run so the paragraph never opens with a block trigger.
+const inlineContentArb: fc.Arbitrary<any[]> = fc
+  .tuple(
+    markedTextRunArb,
+    fc.array(
+      fc.oneof(
+        { weight: 5, arbitrary: markedTextRunArb },
+        { weight: 1, arbitrary: mathInlineArb },
+        { weight: 1, arbitrary: mentionArb },
+        { weight: 1, arbitrary: hardBreakArb },
+      ),
+      { minLength: 0, maxLength: 4 },
+    ),
+  )
+  .map(([first, rest]) => normalizeInline([first, ...rest]));
+
+// Inline content for a HEADING — identical to a paragraph's, but WITHOUT hard
+// breaks. A hard break inside an ATX heading ("# a  \nb") is NOT byte-stable:
+// marked does not honour a hard break inside a heading, so it re-parses as the
+// heading "# a" plus a separate paragraph "b" (md2 = "# a\n\nb"). math/mention/
+// link inside a heading are fine (verified) and stay in the menu.
+const headingInlineContentArb: fc.Arbitrary<any[]> = fc
+  .tuple(
+    markedTextRunArb,
+    fc.array(
+      fc.oneof(
+        { weight: 5, arbitrary: markedTextRunArb },
+        { weight: 1, arbitrary: mathInlineArb },
+        { weight: 1, arbitrary: mentionArb },
+      ),
+      { minLength: 0, maxLength: 4 },
+    ),
+  )
+  .map(([first, rest]) => normalizeInline([first, ...rest]));
+
+// ---------------------------------------------------------------------------
+// Block arbitraries
+// ---------------------------------------------------------------------------
+
+const paragraphArb: fc.Arbitrary<any> = inlineContentArb.map((content) => ({
+  type: 'paragraph',
+  content,
+}));
+
+const headingArb: fc.Arbitrary<any> = fc
+  .tuple(fc.integer({ min: 1, max: 6 }), headingInlineContentArb)
+  .map(([level, content]) => ({ type: 'heading', attrs: { level }, content }));
+
+// Code block content: 1..4 lines of plain phrases (may contain specials inline,
+// which are inert inside a fenced block). Language is optional and is a single
+// lowercase token.
+const codeBlockArb: fc.Arbitrary<any> = fc
+  .tuple(
+    fc.option(fc.constantFrom('js', 'ts', 'python', 'go', 'rust', 'bash'), {
+      nil: '',
+    }),
+    fc
+      .array(safeTextArb, { minLength: 1, maxLength: 4 })
+      .map((lines) => lines.join('\n')),
+  )
+  .map(([language, code]) => ({
+    type: 'codeBlock',
+    attrs: { language },
+    content: [{ type: 'text', text: code }],
+  }));
+
+const blockquoteArb: fc.Arbitrary<any> = paragraphArb.map((p) => ({
+  type: 'blockquote',
+  content: [p],
+}));
+
+const horizontalRuleArb: fc.Arbitrary<any> = fc.constant({
+  type: 'horizontalRule',
+});
+
+// Callout: ONE paragraph child; type restricted to the four the schema knows.
+const calloutArb: fc.Arbitrary<any> = fc
+  .tuple(
+    fc.constantFrom('info', 'success', 'warning', 'danger'),
+    paragraphArb,
+  )
+  .map(([type, p]) => ({ type: 'callout', attrs: { type }, content: [p] }));
+
+const mathBlockArb: fc.Arbitrary<any> = fc
+  .constantFrom('a < b', 'a < b < c', '\\sum_{i=0}^{n} i', 'x = \\frac{-b}{2a}', '')
+  .map((text) => ({ type: 'mathBlock', attrs: { text } }));
+
+const imageArb: fc.Arbitrary<any> = fc
+  .tuple(
+    fc.webUrl(),
+    // alt is a letter-bearing phrase OR empty. Brackets/parens leak into the
+    // markdown image syntax (not byte-stable) so they are excluded, and a purely
+    // numeric alt is coerced to a number and dropped (see letterPhraseArb), so
+    // alt always carries at least one letter when non-empty.
+    fc.option(letterPhraseArb, { nil: '' }),
+  )
+  .map(([src, alt]) => ({ type: 'image', attrs: { src, alt } }));
+
+// A simple list item: ONE paragraph, optionally followed by ONE nested bullet
+// list (single level of nesting). depth controls whether nesting is allowed.
+function listItemArb(allowNest: boolean): fc.Arbitrary<any> {
+  if (!allowNest) {
+    return paragraphArb.map((p) => ({ type: 'listItem', content: [p] }));
+  }
+  return fc
+    .tuple(
+      paragraphArb,
+      fc.option(
+        fc.array(
+          paragraphArb.map((p) => ({ type: 'listItem', content: [p] })),
+          { minLength: 1, maxLength: 3 },
+        ),
+        { nil: undefined },
+      ),
+    )
+    .map(([p, nested]) => ({
+      type: 'listItem',
+      content: nested
+        ? [p, { type: 'bulletList', content: nested }]
+        : [p],
+    }));
+}
+
+const bulletListArb: fc.Arbitrary<any> = fc
+  .array(listItemArb(true), { minLength: 1, maxLength: 4 })
+  .map((items) => ({ type: 'bulletList', content: items }));
+
+const orderedListArb: fc.Arbitrary<any> = fc
+  .array(listItemArb(true), { minLength: 1, maxLength: 4 })
+  .map((items) => ({ type: 'orderedList', content: items }));
+
+// Task item: ONE paragraph, optional ONE nested bullet list.
+const taskItemArb: fc.Arbitrary<any> = fc
+  .tuple(
+    fc.boolean(),
+    paragraphArb,
+    fc.option(
+      fc.array(listItemArb(false), { minLength: 1, maxLength: 2 }),
+      { nil: undefined },
+    ),
+  )
+  .map(([checked, p, nested]) => ({
+    type: 'taskItem',
+    attrs: { checked },
+    content: nested ? [p, { type: 'bulletList', content: nested }] : [p],
+  }));
+
+const taskListArb: fc.Arbitrary<any> = fc
+  .array(taskItemArb, { minLength: 1, maxLength: 4 })
+  .map((items) => ({ type: 'taskList', content: items }));
+
+// GFM table: a header row + 1..3 body rows, with a fixed column count (1..3) and
+// per-column alignment. Cells hold a single short paragraph of safe text.
+const tableArb: fc.Arbitrary<any> = fc
+  .integer({ min: 1, max: 3 })
+  .chain((cols) => {
+    const cellArb = (header: boolean, align?: string) =>
+      phraseArb.map((t) => ({
+        type: header ? 'tableHeader' : 'tableCell',
+        attrs: align ? { align } : {},
+        content: [{ type: 'paragraph', content: [{ type: 'text', text: t }] }],
+      }));
+    const alignsArb = fc.array(
+      fc.constantFrom(undefined, 'left', 'center', 'right'),
+      { minLength: cols, maxLength: cols },
+    );
+    return fc
+      .tuple(
+        alignsArb,
+        fc.array(
+          fc.constant(null), // body-row placeholders; cells filled below
+          { minLength: 1, maxLength: 3 },
+        ),
+      )
+      .chain(([aligns, bodyRows]) => {
+        const headerRow = fc
+          .tuple(...aligns.map((a) => cellArb(true, a)))
+          .map((cells) => ({ type: 'tableRow', content: cells }));
+        const bodyRowArbs = bodyRows.map(() =>
+          fc
+            .tuple(...aligns.map(() => cellArb(false)))
+            .map((cells) => ({ type: 'tableRow', content: cells })),
+        );
+        return fc
+          .tuple(headerRow, fc.tuple(...bodyRowArbs))
+          .map(([h, body]) => ({ type: 'table', content: [h, ...body] }));
+      });
+  });
+
+// ---------------------------------------------------------------------------
+// Top-level document arbitrary
+// ---------------------------------------------------------------------------
+
+// The full menu of block nodes that are byte-stable when SEQUENCED with other
+// blocks. NOTE: `image` is deliberately NOT in this menu — see the dedicated
+// image tests below. The Docmost `image` node is BLOCK-level, but its markdown
+// form `![](url)` is INLINE; marked wraps it in a <p>, the schema then hoists
+// the block <img> out and leaves an EMPTY paragraph beside it, so on the second
+// export the stray empty paragraph injects extra blank lines between siblings
+// ("p\n\n![](u)\n\nq" -> "p\n\n\n\n![](u)\n\nq"). An image is only byte-stable
+// when it is the SOLE block (the edge artifacts get .trim()'d away). It is
+// therefore covered by its own targeted tests, not mixed into multi-block docs.
+const blockArb: fc.Arbitrary<any> = fc.oneof(
+  { weight: 6, arbitrary: paragraphArb },
+  { weight: 3, arbitrary: headingArb },
+  { weight: 2, arbitrary: codeBlockArb },
+  { weight: 2, arbitrary: bulletListArb },
+  { weight: 2, arbitrary: orderedListArb },
+  { weight: 2, arbitrary: taskListArb },
+  { weight: 2, arbitrary: blockquoteArb },
+  { weight: 2, arbitrary: tableArb },
+  { weight: 2, arbitrary: calloutArb },
+  { weight: 1, arbitrary: horizontalRuleArb },
+  { weight: 1, arbitrary: mathBlockArb },
+);
+
+const LIST_TYPES = new Set(['bulletList', 'orderedList', 'taskList']);
+
+// A bounded document: 1..8 block nodes. Kept small so each run is cheap (each
+// run does a real marked + jsdom parse) and shrinking stays fast.
+//
+// Post-process: never let two LIST blocks sit directly adjacent. Two sibling
+// lists that share a marker family — bullet/task both use "-", ordered uses
+// "1." — are MERGED by markdown into a single list when only a blank line
+// separates them ("- a\n\n- b" -> one list -> "- a\n- b"), which is not
+// byte-stable. (A non-list block between two lists separates them fine, as does
+// a different marker family, but dropping every back-to-back list is the clean,
+// always-correct rule.) We drop a list block whenever the previously kept block
+// is also a list.
+const docArb: fc.Arbitrary<any> = fc
+  .array(blockArb, { minLength: 1, maxLength: 8 })
+  .map((content) => {
+    const out: any[] = [];
+    for (const block of content) {
+      const prev = out[out.length - 1];
+      if (
+        prev &&
+        LIST_TYPES.has(prev.type) &&
+        LIST_TYPES.has(block.type)
+      ) {
+        continue; // skip a list that would sit right after another list
+      }
+      out.push(block);
+    }
+    // Guarantee a non-empty document even if filtering removed everything but a
+    // single dropped block (cannot happen here since the first block is always
+    // kept, but keep the invariant explicit).
+    return { type: 'doc', content: out.length ? out : content.slice(0, 1) };
+  });
+
+// ---------------------------------------------------------------------------
+// The properties
+// ---------------------------------------------------------------------------
+
+describe('markdown <-> ProseMirror round-trip (property-based)', () => {
+  it('the generator covers every targeted node type at least once', () => {
+    // A sanity check that the arbitrary actually exercises the intended node
+    // variety within NUM_RUNS — not a correctness property, just coverage.
+    const seen = new Set<string>();
+    const collect = (node: any) => {
+      if (!node || typeof node !== 'object') return;
+      if (node.type) seen.add(node.type);
+      for (const m of node.marks ?? []) seen.add(`mark:${m.type}`);
+      for (const c of node.content ?? []) collect(c);
+    };
+    fc.assert(
+      fc.property(docArb, (doc) => {
+        collect(doc);
+        return true;
+      }),
+      { numRuns: NUM_RUNS, seed: SEED },
+    );
+    // Core block types and marks we expect to appear.
+    for (const t of [
+      'paragraph',
+      'heading',
+      'codeBlock',
+      'bulletList',
+      'orderedList',
+      'taskList',
+      'blockquote',
+      'table',
+      'callout',
+      'horizontalRule',
+      'mathBlock',
+      // 'image' is covered by its own dedicated tests, not docArb.
+      'mention',
+      'mathInline',
+      'hardBreak',
+      'mark:bold',
+      'mark:italic',
+      'mark:strike',
+      'mark:code',
+      'mark:link',
+    ]) {
+      expect(seen, `expected the generator to produce ${t}`).toContain(t);
+    }
+  });
+
+  it('markdown is byte-stable across export -> import -> export', async () => {
+    // The property git needs: a second export reproduces the first byte-for-byte.
+    await fc.assert(
+      fc.asyncProperty(docArb, async (doc) => {
+        const { md1, md2 } = await roundTrip(doc);
+        expect(md2).toBe(md1);
+      }),
+      { numRuns: NUM_RUNS, seed: SEED },
+    );
+  });
+
+  it('the document is semantically stable on a second cycle (ids stripped)', async () => {
+    // Optional, stronger-feeling property. We do NOT compare doc vs doc2: the
+    // converter reconstructs schema default attrs on the FIRST import (a known
+    // SPEC §11 divergence). But once the markdown is byte-stable, importing the
+    // SAME markdown twice must yield structurally identical docs (modulo the
+    // regenerated block ids). So we compare doc2 (import of md1) with doc3
+    // (import of md2 == md1) after stripping ids.
+    await fc.assert(
+      fc.asyncProperty(docArb, async (doc) => {
+        const md1 = convertProseMirrorToMarkdown(doc);
+        const doc2 = await markdownToProseMirror(md1);
+        const md2 = convertProseMirrorToMarkdown(doc2);
+        // Guard: this property only makes sense when md is byte-stable.
+        expect(md2).toBe(md1);
+        const doc3 = await markdownToProseMirror(md2);
+        expect(stripBlockIds(doc3)).toEqual(stripBlockIds(doc2));
+      }),
+      { numRuns: NUM_RUNS, seed: SEED },
+    );
+  });
+
+  it('a SOLE image block is byte-stable', async () => {
+    // An image is byte-stable when it is the only block in the document: the
+    // stray empty paragraph the schema leaves beside the hoisted block <img>
+    // sits at a document edge and is removed by the converter's final .trim().
+    await fc.assert(
+      fc.asyncProperty(imageArb, async (image) => {
+        const doc = { type: 'doc', content: [image] };
+        const { md1, md2 } = await roundTrip(doc);
+        expect(md2).toBe(md1);
+      }),
+      { numRuns: NUM_RUNS, seed: SEED },
+    );
+  });
+
+  // -------------------------------------------------------------------------
+  // KNOWN, DOCUMENTED non-roundtrip bug #2 (kept honest as it.fails).
+  //
+  // BUG: a block-level `image` placed BETWEEN other blocks is not byte-stable.
+  // The Docmost image node is BLOCK-level but its markdown form `![](url)` is
+  // INLINE. marked wraps the inline image in a <p>; the schema then hoists the
+  // block <img> out of that <p>, leaving an EMPTY paragraph as a sibling. On the
+  // second export that empty paragraph renders as "" and the "\n\n" doc join
+  // injects an extra blank gap:
+  //   "p\n\n![x](u)\n\nq"  ->  "p\n\n\n\n![x](u)\n\nq"   (=> md2 !== md1).
+  // Minimal repro doc:
+  //   { type:'doc', content:[
+  //       { type:'paragraph', content:[{type:'text',text:'p'}] },
+  //       { type:'image', attrs:{ src:'http://a.aa', alt:'x' } },
+  //       { type:'paragraph', content:[{type:'text',text:'q'}] } ] }
+  // Not "fixed" — the source must not change; documented and exercised here.
+  // -------------------------------------------------------------------------
+  it.fails('BUG: a block image between other blocks is not byte-stable', async () => {
+    const doc = {
+      type: 'doc',
+      content: [
+        { type: 'paragraph', content: [{ type: 'text', text: 'p' }] },
+        { type: 'image', attrs: { src: 'http://a.aa', alt: 'x' } },
+        { type: 'paragraph', content: [{ type: 'text', text: 'q' }] },
+      ],
+    };
+    const { md1, md2 } = await roundTrip(doc);
+    expect(md2).toBe(md1);
+  });
+
+  // -------------------------------------------------------------------------
+  // KNOWN, DOCUMENTED non-roundtrip bug #1 (kept honest as it.fails).
+  //
+  // BUG: the `code` mark combined with ANY other mark does NOT round-trip.
+  // The converter emits nested HTML so the output is well-formed, e.g.
+  //   marks [code, bold]  ->  md1 = "<strong><code>x</code></strong>"
+  // but the schema's `code` mark declares `excludes: "_"`, so on import the
+  // co-occurring mark is dropped and the run comes back as code-only:
+  //   md2 = "`x`"   (=> md2 !== md1).
+  // Minimal repro doc:
+  //   { type:'doc', content:[ { type:'paragraph', content:[
+  //       { type:'text', text:'x', marks:[{type:'code'},{type:'bold'}] } ] } ] }
+  // This is acknowledged in markdown-converter.ts (the long comment above the
+  // marks switch): preserving both marks is impossible while `code` excludes
+  // them. Documented here, not "fixed", because the source must not change.
+  // -------------------------------------------------------------------------
+  it.fails(
+    'BUG: code mark combined with another mark is not byte-stable',
+    async () => {
+      const codeComboArb = fc
+        .tuple(safeTextArb, fc.constantFrom('bold', 'italic', 'strike'))
+        .map(([t, other]) => ({
+          type: 'doc',
+          content: [
+            {
+              type: 'paragraph',
+              content: [
+                { type: 'text', text: t, marks: [{ type: 'code' }, { type: other }] },
+              ],
+            },
+          ],
+        }));
+      await fc.assert(
+        fc.asyncProperty(codeComboArb, async (doc) => {
+          const { md1, md2 } = await roundTrip(doc);
+          expect(md2).toBe(md1);
+        }),
+        { numRuns: 20, seed: SEED },
+      );
+    },
+  );
+});
--- a/test/recent-since-edges.test.ts
+++ b/test/recent-since-edges.test.ts
@@ -0,0 +1,236 @@
+import { afterEach, describe, expect, it, vi } from 'vitest';
+// Import from source (not the built barrel/dist) for consistency with the rest
+// of the docmost-client test wave and to avoid running stale compiled output.
+import { collectRecentSince } from '../packages/docmost-client/src/client.js';
+
+/**
+ * Edge-case unit tests for `collectRecentSince`, complementing
+ * `test/recent-since.test.ts` (which covers the happy / cap / dedup / order
+ * paths). These tests target the defensive `!= null` guards, the exact cutoff
+ * boundary, and a mid-walk null cursor — none of which the existing suite
+ * exercises. `fetchPage` is always faked; no network is involved.
+ *
+ * Imported `from 'docmost-client'` (the built barrel) to match the behaviour
+ * the existing suite asserts against.
+ */
+
+// An item may be malformed (missing id and/or updatedAt), so every field is
+// optional here on purpose — that is exactly what these tests probe.
+type Item = { id?: string; updatedAt?: string };
+
+/**
+ * Build a fake `fetchPage` from an ordered list of pages. Page i's nextCursor
+ * points at page i+1; the last page has no cursor (null). Tracks the call
+ * count and the sequence of cursors the function asked for, so we can assert
+ * the walk stopped where we expect.
+ */
+function fakeServer(pages: Item[][]) {
+  let calls = 0;
+  const cursorsRequested: (string | null)[] = [];
+  const cursorFor = (i: number) => (i < pages.length - 1 ? `c${i}` : null);
+  const fetchPage = async (cursor: string | null) => {
+    // null -> page 0, "cN" -> page N+1 (mirrors the existing suite's helper).
+    const idx = cursor === null ? 0 : Number(cursor.slice(1)) + 1;
+    calls++;
+    cursorsRequested.push(cursor);
+    const items = pages[idx] ?? [];
+    return { items, nextCursor: cursorFor(idx) };
+  };
+  return {
+    fetchPage,
+    get calls() {
+      return calls;
+    },
+    get cursorsRequested() {
+      return cursorsRequested;
+    },
+  };
+}
+
+afterEach(() => {
+  vi.restoreAllMocks();
+});
+
+describe('collectRecentSince — malformed items (the `!= null` guards)', () => {
+  it('keeps an item with no updatedAt without tripping the cutoff', async () => {
+    // The item with no `updatedAt` must skip the `<= cutoff` comparison
+    // entirely (guard: item.updatedAt != null) and therefore be collected
+    // rather than terminating the scan. The genuinely-old 'old' item that
+    // follows it is what stops the walk.
+    const server = fakeServer([
+      [
+        { id: 'a', updatedAt: '2026-06-16T10:00:00Z' },
+        { id: 'no-ts' }, // no updatedAt -> cutoff check skipped, still collected
+        { id: 'b', updatedAt: '2026-06-16T09:00:00Z' },
+        { id: 'old', updatedAt: '2026-06-16T01:00:00Z' }, // <= cutoff -> stop
+        { id: 'after', updatedAt: '2026-06-16T00:30:00Z' },
+      ],
+    ]);
+
+    const out = await collectRecentSince(
+      server.fetchPage,
+      '2026-06-16T05:00:00Z',
+    );
+
+    // 'no-ts' survives between the two newer items; 'old' and everything after
+    // it is excluded once the cutoff is hit.
+    expect(out.map((i) => i.id)).toEqual(['a', 'no-ts', 'b']);
+  });
+
+  it('keeps an item with no id and never dedups it', async () => {
+    // Items without an `id` are never added to the `seen` set (guard:
+    // item.id != null), so they are never deduped: every no-id item — even
+    // identical ones — is collected. A no-id item must not throw on the
+    // `seen.has(undefined)` path either.
+    const server = fakeServer([
+      [
+        { id: 'a', updatedAt: '2026-06-16T10:00:00Z' },
+        { updatedAt: '2026-06-16T09:30:00Z' }, // no id
+        { updatedAt: '2026-06-16T09:30:00Z' }, // identical, no id -> NOT deduped
+        { id: 'b', updatedAt: '2026-06-16T09:00:00Z' },
+      ],
+    ]);
+
+    const out = await collectRecentSince(
+      server.fetchPage,
+      '2026-06-16T01:00:00Z',
+    );
+
+    // Both no-id items are kept (length 4), proving no-id items bypass dedup.
+    expect(out).toHaveLength(4);
+    expect(out.map((i) => i.id)).toEqual(['a', undefined, undefined, 'b']);
+  });
+
+  it('does not let a malformed item break id-based dedup of real items', async () => {
+    // A malformed (no id, no updatedAt) item appears alongside a real id that
+    // overlaps across pages. The real id 'b' must still be deduped exactly
+    // once, and the malformed item must not interfere with that bookkeeping.
+    const server = fakeServer([
+      [
+        { id: 'a', updatedAt: '2026-06-16T10:00:00Z' },
+        {}, // fully malformed: no id, no updatedAt
+        { id: 'b', updatedAt: '2026-06-16T09:00:00Z' },
+      ],
+      [
+        { id: 'b', updatedAt: '2026-06-16T09:00:00Z' }, // overlap -> deduped
+        { id: 'c', updatedAt: '2026-06-16T08:00:00Z' },
+      ],
+    ]);
+
+    const out = await collectRecentSince(
+      server.fetchPage,
+      '2026-06-16T01:00:00Z',
+    );
+
+    // Real ids appear once each; the malformed item is kept once (it counts as
+    // a new item, so it does not stall progress between pages).
+    expect(out.map((i) => i.id)).toEqual(['a', undefined, 'b', 'c']);
+    expect(server.calls).toBe(2);
+  });
+});
+
+describe('collectRecentSince — exact cutoff boundary (updatedAt === sinceIso)', () => {
+  it('EXCLUDES an item whose updatedAt equals sinceIso (<= is inclusive on the boundary)', async () => {
+    // The comparison is `item.updatedAt <= sinceIso`, so an item exactly AT
+    // the cutoff satisfies it and is treated as the stop point: that item and
+    // everything after it is excluded.
+    const server = fakeServer([
+      [
+        { id: 'a', updatedAt: '2026-06-16T06:00:00Z' },
+        { id: 'boundary', updatedAt: '2026-06-16T05:00:00Z' }, // === sinceIso
+        { id: 'after', updatedAt: '2026-06-16T04:00:00Z' },
+      ],
+      [{ id: 'never', updatedAt: '2026-06-16T03:00:00Z' }], // must not be fetched
+    ]);
+
+    const out = await collectRecentSince(
+      server.fetchPage,
+      '2026-06-16T05:00:00Z',
+    );
+
+    // Only the strictly-newer 'a'; the boundary item is the cutoff and is
+    // excluded, and the walk stops without fetching page 1.
+    expect(out.map((i) => i.id)).toEqual(['a']);
+    expect(server.calls).toBe(1);
+  });
+
+  it('returns an empty array when the very first item is exactly at the cutoff', async () => {
+    // Boundary item is first on the page: the loop hits the cutoff immediately
+    // and collects nothing.
+    const server = fakeServer([
+      [
+        { id: 'boundary', updatedAt: '2026-06-16T05:00:00Z' }, // === sinceIso
+        { id: 'after', updatedAt: '2026-06-16T04:00:00Z' },
+      ],
+    ]);
+
+    const out = await collectRecentSince(
+      server.fetchPage,
+      '2026-06-16T05:00:00Z',
+    );
+
+    expect(out).toEqual([]);
+    expect(server.calls).toBe(1);
+  });
+});
+
+describe('collectRecentSince — nextCursor null mid-walk before cutoff', () => {
+  it('stops and returns what it has when the cursor runs out before the cutoff', async () => {
+    // Both pages are entirely newer than the cutoff (so `reachedCutoff` stays
+    // false), but the last page has nextCursor === null. The `if
+    // (!data.nextCursor) break` must end the walk gracefully and return the
+    // accumulated items — no extra fetch, no warning (cap not hit).
+    const server = fakeServer([
+      [
+        { id: 'a', updatedAt: '2026-06-16T10:00:00Z' },
+        { id: 'b', updatedAt: '2026-06-16T09:00:00Z' },
+      ],
+      [
+        { id: 'c', updatedAt: '2026-06-16T08:00:00Z' },
+        { id: 'd', updatedAt: '2026-06-16T07:00:00Z' }, // still all newer
+      ],
+    ]);
+
+    const warn = vi.spyOn(console, 'warn').mockImplementation(() => {});
+
+    const out = await collectRecentSince(
+      server.fetchPage,
+      '2026-06-16T01:00:00Z',
+      50, // generous cap: the null cursor, not the cap, must stop the walk
+    );
+
+    // Everything from both pages, in server order; the null cursor ends it.
+    expect(out.map((i) => i.id)).toEqual(['a', 'b', 'c', 'd']);
+    // Exactly the two real pages were fetched (page 0 via null, page 1 via c0).
+    expect(server.calls).toBe(2);
+    expect(server.cursorsRequested).toEqual([null, 'c0']);
+    // The cutoff was never reached, but we exhausted the feed naturally, so no
+    // truncation warning is emitted.
+    expect(warn).not.toHaveBeenCalled();
+  });
+});
+
+describe('collectRecentSince — hardPageCap warning (re-confirm)', () => {
+  it('warns once when the cap is hit before the cutoff is reached', async () => {
+    // Endless feed of unique, all-newer items with a perpetual nextCursor: the
+    // only stop condition is the cap, which must emit exactly one truncation
+    // warning naming the cap value.
+    let n = 0;
+    const fetchPage = async (_cursor: string | null) => {
+      const id = `id${n++}`;
+      return {
+        items: [{ id, updatedAt: '2026-06-16T10:00:00Z' }] as Item[],
+        nextCursor: 'next', // never runs out
+      };
+    };
+
+    const warn = vi.spyOn(console, 'warn').mockImplementation(() => {});
+
+    const cap = 3;
+    const out = await collectRecentSince(fetchPage, '2020-01-01T00:00:00Z', cap);
+
+    expect(out).toHaveLength(cap);
+    expect(warn).toHaveBeenCalledTimes(1);
+    expect(String(warn.mock.calls[0][0])).toContain('hardPageCap=3');
+  });
+});