fix(git-sync): push 503 starvation + concurrent-edit marker leak/silent loss
Bug #1 (push 503 starvation): an external receive-pack that briefly overlapped a poll cycle immediately 503'd because the per-space single-writer lock was held. Add a BOUNDED retry-acquire on the PUSH path only (SpaceLockService .withSpaceLock acquireRetry: capped exponential backoff up to ~5s); a transient overlap now waits and succeeds, a genuinely stuck cycle still 503s after the bound. The poll cycle passes no retry (immediate skip). Push result stays deterministic: the receive-pack only runs once the lock is held, so a 503 never leaves a half-applied ref. Bug #2 (concurrent-edit marker leak + silent same-block loss): - Marker leak (a): the push UPDATE path stripped markers for the body sent to Docmost but left raw <<<<<<</>>>>>>> committed on the published `main` vault forever (autoMergeConflicts ON). Now the cleaned body is written back to the vault file + recorded in writtenBack so runPush commits it on `main` and the vault converges to clean bytes. - Marker leak (b): pin merge.conflictStyle=merge in ensureRepo and teach stripConflictMarkers/hasConflictMarkers about the diff3 `|||||||` base section (drop the marker AND the stale base region) so diff3/zdiff3 conflicts can never leak `|||||||` + base content into a page. Also scrub the 3-way merge BASE markdown. - Silent same-block loss: the block 3-way merge still resolves same-block conflicts deterministically to git, but it is no longer silent: diff3Plan now reports a conflict count (mergeXmlFragments3WayWithStats), gitSyncWriteBody logs it, and the persistence boundary-snapshot now fires for git-sync writes over a non-git-sync baseline so the human's pre-merge content is preserved in page history (recoverable). Full both-preserved persisted-conflict UI remains the deferred redesign. Tests: space-lock bounded-retry (success/stuck/poll-immediate); push vault-clean + diff3 ||||||| strip; ensureRepo conflictStyle pin; diff3Plan/3-way conflict counts; persistence git-sync boundary snapshot. Server tsc clean; git-sync vitest + server collaboration/git-sync jest all green. Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
This commit is contained in:
@@ -220,6 +220,13 @@ export class VaultGit {
|
||||
// that core.autocrlf=false does not cover). POSIX-only path, which is
|
||||
// fine: the daemon runs on Linux (Docker) / macOS. A system
|
||||
// /etc/gitattributes remains the host admin's domain (out of scope).
|
||||
// - merge.conflictStyle=merge — CRITICAL (SPEC §9, conflict-marker leak):
|
||||
// a global `merge.conflictStyle=diff3`/`zdiff3` makes a conflicting merge
|
||||
// emit an EXTRA `|||||||` base-marker section. The conflict-marker
|
||||
// scrub on the push side (`stripConflictMarkers`) handles `|||||||` too,
|
||||
// but pinning the classic `merge` style keeps the markers the engine
|
||||
// produces to the canonical three (`<<<<<<<`/`=======`/`>>>>>>>`) so
|
||||
// behavior is deterministic regardless of the operator's global config.
|
||||
// NOTE: these stay PERSISTED LOCAL config (not `-c` flags) on purpose — a
|
||||
// human running git by hand in the vault must inherit the same neutralized
|
||||
// behavior; a transient `-c` would not persist. (core.quotepath, by
|
||||
@@ -230,6 +237,7 @@ export class VaultGit {
|
||||
await this.run(["config", "core.safecrlf", "false"]);
|
||||
await this.run(["config", "commit.gpgsign", "false"]);
|
||||
await this.run(["config", "core.attributesFile", "/dev/null"]);
|
||||
await this.run(["config", "merge.conflictStyle", "merge"]);
|
||||
} catch (err: unknown) {
|
||||
const detail = err instanceof Error ? err.message : String(err);
|
||||
throw new Error(
|
||||
|
||||
@@ -699,19 +699,39 @@ export async function applyPushActions(
|
||||
});
|
||||
continue;
|
||||
}
|
||||
const conflicted = hasConflictMarkers(rawBody);
|
||||
const body = stripConflictMarkers(rawBody);
|
||||
// The last-synced version of this file (pre-image) is the common ancestor
|
||||
// for a 3-way merge against the live page, so concurrent human edits are
|
||||
// not clobbered (review #5). Null when the file is new at last-pushed. Its
|
||||
// body is stripped the SAME way so the merge compares body-to-body.
|
||||
// body is stripped the SAME way (frontmatter AND conflict markers) so the
|
||||
// merge compares clean body-to-body: a base that itself carried markers
|
||||
// (from a prior conflict commit) must never reintroduce marker syntax or a
|
||||
// stale diff3 base region into the 3-way merge.
|
||||
const baseFull = await deps.git.showFileAtRef(LAST_PUSHED_REF, u.path);
|
||||
const baseMarkdown = baseFull === null ? null : parsePageFile(baseFull).body;
|
||||
const baseMarkdown =
|
||||
baseFull === null
|
||||
? null
|
||||
: stripConflictMarkers(parsePageFile(baseFull).body);
|
||||
const result = await client.importPageMarkdown(
|
||||
u.pageId,
|
||||
body,
|
||||
baseMarkdown,
|
||||
);
|
||||
updated++;
|
||||
// CONFLICT VAULT-CLEAN (autoMergeConflicts ON, SPEC §9 marker leak). On ON
|
||||
// a conflicted page is auto-merged INTO Docmost (the clean `body` above),
|
||||
// but the file on `main` still carries the raw `<<<<<<<`/`>>>>>>>` markers
|
||||
// the pull-side `commitMerge` committed. Left as-is they would (1) stay in
|
||||
// the PUBLISHED vault forever (external clones see raw markers) and (2)
|
||||
// re-conflict every cycle. So write the CLEAN body back to the vault file
|
||||
// and record it in `writtenBack` — `runPush` step 7a commits it on `main`
|
||||
// and re-advances the refs, so the published vault converges to the merged
|
||||
// content. Only conflicted files are rewritten (no churn for clean updates).
|
||||
if (conflicted) {
|
||||
await deps.writeFile(u.path, serializePageFile(u.pageId, body));
|
||||
writtenBack.push({ path: u.path, pageId: u.pageId });
|
||||
}
|
||||
// §10 loop-guard data: hash the BODY we pushed + capture `updatedAt`.
|
||||
pushed.push({
|
||||
pageId: u.pageId,
|
||||
@@ -1083,13 +1103,23 @@ export function isPageFile(path: string): boolean {
|
||||
* Docmost). A body is treated as conflicted only when it carries BOTH a begin
|
||||
* (`<<<<<<<`) and an end (`>>>>>>>`) marker line, so a legitimate Markdown setext
|
||||
* heading underline (`=======`) is not mistaken for a conflict. When conflicted,
|
||||
* the three marker line types are removed while BOTH sides' content is preserved
|
||||
* (no data loss): the marker SYNTAX never reaches Docmost, but the human's content
|
||||
* does — where the conflict is visible and fixable rather than silently dropped.
|
||||
* every marker line type is removed while the human-visible content is preserved
|
||||
* (no data loss): the marker SYNTAX never reaches Docmost, but the content does —
|
||||
* where the conflict is visible and fixable rather than silently dropped.
|
||||
*
|
||||
* `diff3`/`zdiff3` style: a conflict in that style adds a `|||||||` base section
|
||||
* (`|||||||` line + the merge-BASE content + `=======`). `ensureRepo` pins
|
||||
* `merge.conflictStyle=merge` so the engine never produces it, but a vault that
|
||||
* predates the pin — or content arriving via an external push that a human
|
||||
* committed in diff3 style — could still carry it. So we ALSO recognize the
|
||||
* `|||||||` marker and DROP the stale base region it introduces (between
|
||||
* `|||||||` and `=======`): the base text is neither side's current content, so
|
||||
* keeping it would inject obsolete lines AND leak a raw `|||||||` marker.
|
||||
*/
|
||||
const CONFLICT_BEGIN_RE = /^<{7}/m;
|
||||
const CONFLICT_END_RE = /^>{7}/m;
|
||||
const CONFLICT_BEGIN_LINE_RE = /^<{7}/;
|
||||
const CONFLICT_BASE_LINE_RE = /^\|{7}/;
|
||||
const CONFLICT_SEP_LINE_RE = /^={7}/;
|
||||
const CONFLICT_END_LINE_RE = /^>{7}/;
|
||||
|
||||
@@ -1099,23 +1129,37 @@ export function hasConflictMarkers(body: string): boolean {
|
||||
|
||||
function stripConflictMarkers(body: string): string {
|
||||
if (!hasConflictMarkers(body)) return body;
|
||||
// Remove ONLY the three marker line types, and treat a `=======` line as a
|
||||
// conflict separator ONLY when we are between a `<<<<<<<` begin and a `>>>>>>>`
|
||||
// end — so a legitimate Markdown setext heading underline (`=======`) outside a
|
||||
// conflict block is preserved (review finding). Both conflict sides' content is
|
||||
// kept; only the marker SYNTAX is dropped.
|
||||
let inBlock = false;
|
||||
// Track where we are inside a conflict block so a `=======` line is treated as
|
||||
// a conflict separator ONLY between a `<<<<<<<` begin and a `>>>>>>>` end — a
|
||||
// legitimate Markdown setext heading underline (`=======`) outside a conflict
|
||||
// block is preserved (review finding). State machine over the block:
|
||||
// 'no' — outside any conflict block.
|
||||
// 'ours' — after `<<<<<<<`, before `|||||||`/`=======` (our side: KEEP).
|
||||
// 'base' — after `|||||||`, before `=======` (diff3 base region: DROP).
|
||||
// 'theirs' — after `=======`, before `>>>>>>>` (their side: KEEP).
|
||||
// Every marker LINE itself is dropped; only the base region's content is also
|
||||
// dropped (it is stale and not part of either current side).
|
||||
let state: "no" | "ours" | "base" | "theirs" = "no";
|
||||
const out: string[] = [];
|
||||
for (const line of body.split("\n")) {
|
||||
if (CONFLICT_BEGIN_LINE_RE.test(line)) {
|
||||
inBlock = true;
|
||||
state = "ours";
|
||||
continue;
|
||||
}
|
||||
if (CONFLICT_END_LINE_RE.test(line)) {
|
||||
inBlock = false;
|
||||
if (state !== "no" && CONFLICT_END_LINE_RE.test(line)) {
|
||||
state = "no";
|
||||
continue;
|
||||
}
|
||||
if (inBlock && CONFLICT_SEP_LINE_RE.test(line)) {
|
||||
if (state === "ours" && CONFLICT_BASE_LINE_RE.test(line)) {
|
||||
state = "base";
|
||||
continue;
|
||||
}
|
||||
if ((state === "ours" || state === "base") && CONFLICT_SEP_LINE_RE.test(line)) {
|
||||
state = "theirs";
|
||||
continue;
|
||||
}
|
||||
// Drop the diff3 base region's content (stale, neither current side).
|
||||
if (state === "base") {
|
||||
continue;
|
||||
}
|
||||
out.push(line);
|
||||
|
||||
Reference in New Issue
Block a user