From 62cc474002481cee707f480b3c44ba430dd43fac Mon Sep 17 00:00:00 2001
From: Jeremy <jeremy@fluxlabs.net>
Date: Sat, 4 Apr 2026 10:00:07 -0500
Subject: [PATCH] test(gsd): fill state machine E2E verification gaps (#3498)

Add 102 integration tests across two new files covering state machine
edge cases, runtime failures, and boundary conditions not exercised
by the existing live-validation suite.

Closes #3498
---
 .../state-machine-edge-cases.test.ts          | 1188 +++++++++++++++++
 .../state-machine-runtime-failures.test.ts    |  841 ++++++++++++
 2 files changed, 2029 insertions(+)
 create mode 100644 src/resources/extensions/gsd/tests/integration/state-machine-edge-cases.test.ts
 create mode 100644 src/resources/extensions/gsd/tests/integration/state-machine-runtime-failures.test.ts

diff --git a/src/resources/extensions/gsd/tests/integration/state-machine-edge-cases.test.ts b/src/resources/extensions/gsd/tests/integration/state-machine-edge-cases.test.ts
new file mode 100644
index 000000000..320d3a6e6
--- /dev/null
+++ b/src/resources/extensions/gsd/tests/integration/state-machine-edge-cases.test.ts
@@ -0,0 +1,1188 @@
+/**
+ * state-machine-edge-cases.test.ts — Gap-filling tests for the GSD state
+ * machine covering failure modes, boundary conditions, and edge cases NOT
+ * covered by the existing state-machine-live-validation.test.ts suite.
+ *
+ * Coverage gaps filled:
+ * 1. State derivation failures (file deletion races, partial DB, cache staleness,
+ *    corrupt files, 0-slice ROADMAP)
+ * 2. Transition boundary failures (mid-transition mutation, cascading blockers,
+ *    multi-level milestone deps, blocked→unblocked recovery)
+ * 3. Dispatch failures (null activeSlice, evaluating-gates without config,
+ *    unhandled phase, missing task plan recovery)
+ * 4. Completion & verification failures (unparseable verdict, needs-remediation
+ *    blocks completion, missing SUMMARY blocks validation, UAT verdict gate,
+ *    replan loop cap)
+ */
+
+// GSD State Machine Edge Case Tests
+
+import { describe, test, beforeEach, afterEach } from "node:test";
+import assert from "node:assert/strict";
+import {
+  mkdtempSync,
+  mkdirSync,
+  writeFileSync,
+  readFileSync,
+  rmSync,
+  existsSync,
+  unlinkSync,
+} from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+
+// ── DB layer ──────────────────────────────────────────────────────────────
+import {
+  openDatabase,
+  closeDatabase,
+  insertMilestone,
+  insertSlice,
+  insertTask,
+  getTask,
+  getSlice,
+  getMilestone,
+  getSliceTasks,
+  getMilestoneSlices,
+  updateTaskStatus,
+  updateSliceStatus,
+  updateMilestoneStatus,
+  insertReplanHistory,
+  getReplanHistory,
+  insertGateRow,
+  getPendingGates,
+} from "../../gsd-db.ts";
+
+// ── State derivation ──────────────────────────────────────────────────────
+import {
+  deriveState,
+  deriveStateFromDb,
+  invalidateStateCache,
+  isGhostMilestone,
+  isValidationTerminal,
+} from "../../state.ts";
+
+// ── Status guards ─────────────────────────────────────────────────────────
+import { isClosedStatus } from "../../status-guards.ts";
+
+// ── Cache invalidation ───────────────────────────────────────────────────
+import { invalidateAllCaches } from "../../cache.ts";
+
+// ── Dispatch ─────────────────────────────────────────────────────────────
+import {
+  resolveDispatch,
+  DISPATCH_RULES,
+  getDispatchRuleNames,
+} from "../../auto-dispatch.ts";
+import type { DispatchContext, DispatchAction } from "../../auto-dispatch.ts";
+
+// ── Verdict parser ──────────────────────────────────────────────────────
+import {
+  extractVerdict,
+  isAcceptableUatVerdict,
+  isValidMilestoneVerdict,
+} from "../../verdict-parser.ts";
+
+// ── Path helpers ─────────────────────────────────────────────────────────
+import { clearPathCache } from "../../paths.ts";
+
+// ═══════════════════════════════════════════════════════════════════════════
+// Fixture Helpers
+// ═══════════════════════════════════════════════════════════════════════════
+
+function makeTempDir(): string {
+  return mkdtempSync(join(tmpdir(), "gsd-edge-cases-"));
+}
+
+/**
+ * Create a standard .gsd/ fixture with M001 containing S01 (2 tasks) and S02 (1 task).
+ * Same structure as state-machine-live-validation.test.ts for consistency.
+ */
+function createFullFixture(): string {
+  const base = makeTempDir();
+  const gsdDir = join(base, ".gsd");
+  const m001Dir = join(gsdDir, "milestones", "M001");
+  const s01Dir = join(m001Dir, "slices", "S01");
+  const s01Tasks = join(s01Dir, "tasks");
+  const s02Dir = join(m001Dir, "slices", "S02");
+  const s02Tasks = join(s02Dir, "tasks");
+
+  mkdirSync(s01Tasks, { recursive: true });
+  mkdirSync(s02Tasks, { recursive: true });
+
+  writeFileSync(
+    join(m001Dir, "M001-CONTEXT.md"),
+    [
+      "# M001: Edge Case Milestone",
+      "",
+      "## Purpose",
+      "Test state machine edge cases.",
+    ].join("\n"),
+  );
+
+  writeFileSync(
+    join(m001Dir, "M001-ROADMAP.md"),
+    [
+      "# M001: Edge Case Milestone",
+      "",
+      "## Vision",
+      "Prove edge case correctness.",
+      "",
+      "## Success Criteria",
+      "- All edge cases handled",
+      "",
+      "## Slices",
+      "",
+      "- [ ] **S01: First Feature** `risk:low` `depends:[]`",
+      "  - After this: First feature proven.",
+      "",
+      "- [ ] **S02: Second Feature** `risk:low` `depends:[]`",
+      "  - After this: Second feature proven.",
+      "",
+      "## Boundary Map",
+      "",
+      "| From | To | Produces | Consumes |",
+      "|------|----|----------|----------|",
+      "| S01 | terminal | feature-a | nothing |",
+      "| S02 | terminal | feature-b | nothing |",
+    ].join("\n"),
+  );
+
+  writeFileSync(
+    join(s01Dir, "S01-PLAN.md"),
+    [
+      "# S01: First Feature",
+      "",
+      "**Goal:** Implement first feature.",
+      "",
+      "## Tasks",
+      "",
+      "- [ ] **T01: Implementation** `est:30m`",
+      "  - Do: Build it",
+      "  - Verify: Run tests",
+      "",
+      "- [ ] **T02: Testing** `est:30m`",
+      "  - Do: Write tests",
+      "  - Verify: Run tests",
+    ].join("\n"),
+  );
+
+  writeFileSync(join(s01Tasks, "T01-PLAN.md"), "# T01 Plan\nImplement.\n");
+  writeFileSync(join(s01Tasks, "T02-PLAN.md"), "# T02 Plan\nTest.\n");
+
+  writeFileSync(
+    join(s02Dir, "S02-PLAN.md"),
+    [
+      "# S02: Second Feature",
+      "",
+      "**Goal:** Implement second feature.",
+      "",
+      "## Tasks",
+      "",
+      "- [ ] **T01: Implementation** `est:30m`",
+      "  - Do: Build it",
+      "  - Verify: Run tests",
+    ].join("\n"),
+  );
+
+  writeFileSync(join(s02Tasks, "T01-PLAN.md"), "# T01 Plan\nBuild.\n");
+
+  return base;
+}
+
+/**
+ * Create a multi-milestone fixture with M001 → M002 → M003 dependency chain.
+ */
+function createMultiMilestoneFixture(): string {
+  const base = makeTempDir();
+  const gsdDir = join(base, ".gsd");
+
+  for (const mid of ["M001", "M002", "M003"]) {
+    const mDir = join(gsdDir, "milestones", mid);
+    const sDir = join(mDir, "slices", "S01", "tasks");
+    mkdirSync(sDir, { recursive: true });
+
+    writeFileSync(
+      join(mDir, `${mid}-CONTEXT.md`),
+      `# ${mid}: Milestone ${mid.slice(-1)}\n\n## Purpose\nTest deps.\n`,
+    );
+
+    writeFileSync(
+      join(mDir, `${mid}-ROADMAP.md`),
+      [
+        `# ${mid}: Milestone ${mid.slice(-1)}`,
+        "",
+        "## Vision",
+        "Test dependency chains.",
+        "",
+        "## Success Criteria",
+        "- Works",
+        "",
+        "## Slices",
+        "",
+        "- [ ] **S01: Only Slice** `risk:low` `depends:[]`",
+        "  - After this: Done.",
+        "",
+        "## Boundary Map",
+        "",
+        "| From | To | Produces | Consumes |",
+        "|------|----|----------|----------|",
+        "| S01 | terminal | output | nothing |",
+      ].join("\n"),
+    );
+
+    writeFileSync(
+      join(mDir, "slices", "S01", "S01-PLAN.md"),
+      [
+        "# S01: Only Slice",
+        "",
+        "**Goal:** Do the thing.",
+        "",
+        "## Tasks",
+        "",
+        "- [ ] **T01: Task** `est:30m`",
+        "  - Do: Implement",
+        "  - Verify: Run tests",
+      ].join("\n"),
+    );
+
+    writeFileSync(join(sDir, "T01-PLAN.md"), "# T01 Plan\nDo it.\n");
+  }
+
+  return base;
+}
+
+function buildDispatchCtx(
+  base: string,
+  mid: string,
+  stateOverrides: Partial<import("../../types.ts").GSDState> = {},
+): DispatchContext {
+  return {
+    basePath: base,
+    mid,
+    midTitle: `${mid} Test`,
+    state: {
+      activeMilestone: { id: mid, title: `${mid} Test` },
+      activeSlice: null,
+      activeTask: null,
+      phase: "executing",
+      recentDecisions: [],
+      blockers: [],
+      nextAction: "",
+      registry: [],
+      requirements: { active: 0, validated: 0, invalidated: 0, deferred: 0 },
+      progress: { milestones: { done: 0, total: 1 } },
+      ...stateOverrides,
+    },
+    prefs: undefined,
+  };
+}
+
+// ═══════════════════════════════════════════════════════════════════════════
+// Test Suite
+// ═══════════════════════════════════════════════════════════════════════════
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 1: State Derivation Failure Modes
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("state derivation failures", () => {
+  let base: string;
+
+  afterEach(() => {
+    try { closeDatabase(); } catch { /* may not be open */ }
+    if (base) rmSync(base, { recursive: true, force: true });
+  });
+
+  test("file deleted between deriveState calls produces consistent result", async () => {
+    // Simulates race condition: PLAN file exists on first derive, deleted before second
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "First", status: "in_progress" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "pending" });
+
+    invalidateAllCaches();
+    const stateBefore = await deriveStateFromDb(base);
+    assert.equal(stateBefore.phase, "executing");
+
+    // Delete the task plan file mid-flow
+    const planPath = join(base, ".gsd", "milestones", "M001", "slices", "S01", "tasks", "T01-PLAN.md");
+    if (existsSync(planPath)) unlinkSync(planPath);
+
+    invalidateAllCaches();
+    const stateAfter = await deriveStateFromDb(base);
+    // State machine should still function — either executing (DB says task exists)
+    // or planning (missing plan file triggers replan). Should NOT throw.
+    assert.ok(
+      ["executing", "planning"].includes(stateAfter.phase),
+      `expected executing or planning after plan deletion, got: ${stateAfter.phase}`,
+    );
+  });
+
+  test("partial DB write: milestone inserted but no slices → pre-planning", async () => {
+    base = makeTempDir();
+    const mDir = join(base, ".gsd", "milestones", "M001");
+    mkdirSync(mDir, { recursive: true });
+    writeFileSync(join(mDir, "M001-CONTEXT.md"), "# M001: Test\n\n## Purpose\nTest.\n");
+
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    // Only insert milestone — no slices, no roadmap
+    insertMilestone({ id: "M001", title: "Partial", status: "active" });
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+    // No roadmap → pre-planning (milestone exists but no structure yet)
+    assert.equal(state.phase, "pre-planning");
+    assert.equal(state.activeMilestone?.id, "M001");
+  });
+
+  test("cache staleness: derive within TTL returns same result after DB mutation", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "First", status: "in_progress" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "pending" });
+
+    // First call populates cache
+    invalidateStateCache();
+    const state1 = await deriveState(base);
+    assert.equal(state1.phase, "executing");
+
+    // Mutate DB WITHOUT invalidating cache
+    updateTaskStatus("M001", "S01", "T01", "complete", new Date().toISOString());
+
+    // Second call within 100ms TTL should return cached (stale) result
+    const state2 = await deriveState(base);
+    assert.equal(state2.phase, "executing", "cached result should still show executing");
+
+    // After explicit invalidation, should reflect the DB mutation
+    invalidateStateCache();
+    const state3 = await deriveState(base);
+    assert.equal(state3.phase, "summarizing", "after cache invalidation should show summarizing");
+  });
+
+  test("corrupt ROADMAP: binary content does not crash deriveState", async () => {
+    base = makeTempDir();
+    const mDir = join(base, ".gsd", "milestones", "M001");
+    mkdirSync(mDir, { recursive: true });
+    writeFileSync(join(mDir, "M001-CONTEXT.md"), "# M001: Corrupt\n\n## Purpose\nTest.\n");
+    // Write binary garbage as ROADMAP
+    writeFileSync(join(mDir, "M001-ROADMAP.md"), Buffer.from([0x00, 0xFF, 0xFE, 0x89, 0x50, 0x4E, 0x47]));
+
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Corrupt", status: "active" });
+
+    invalidateAllCaches();
+    // Should NOT throw — should degrade gracefully
+    const state = await deriveStateFromDb(base);
+    assert.ok(state.phase, "should produce a valid phase even with corrupt ROADMAP");
+  });
+
+  test("0-byte ROADMAP file is treated as no roadmap (pre-planning)", async () => {
+    base = makeTempDir();
+    const mDir = join(base, ".gsd", "milestones", "M001");
+    mkdirSync(mDir, { recursive: true });
+    writeFileSync(join(mDir, "M001-CONTEXT.md"), "# M001: Empty\n\n## Purpose\nTest.\n");
+    writeFileSync(join(mDir, "M001-ROADMAP.md"), "");
+
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Empty", status: "active" });
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+    assert.equal(state.phase, "pre-planning", "empty ROADMAP should result in pre-planning");
+  });
+
+  test("ROADMAP with no ## Slices section derives pre-planning", async () => {
+    base = makeTempDir();
+    const mDir = join(base, ".gsd", "milestones", "M001");
+    mkdirSync(mDir, { recursive: true });
+    writeFileSync(join(mDir, "M001-CONTEXT.md"), "# M001: No Slices\n\n## Purpose\nTest.\n");
+    writeFileSync(
+      join(mDir, "M001-ROADMAP.md"),
+      [
+        "# M001: No Slices",
+        "",
+        "## Vision",
+        "Test zero slices.",
+        "",
+        "## Success Criteria",
+        "- Works",
+        "",
+        "## Slices",
+        "",
+        "## Boundary Map",
+        "",
+        "| From | To | Produces | Consumes |",
+        "|------|----|----------|----------|",
+      ].join("\n"),
+    );
+
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "No Slices", status: "active" });
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+    // 0-slice ROADMAP guard: should NOT derive validating-milestone (#2667)
+    assert.notEqual(
+      state.phase,
+      "validating-milestone",
+      "0-slice ROADMAP must NOT produce validating-milestone",
+    );
+  });
+
+  test("corrupt VALIDATION frontmatter: extractVerdict returns undefined", () => {
+    // Test the verdict parser directly with malformed content
+    assert.equal(extractVerdict(""), undefined, "empty string → undefined");
+    assert.equal(extractVerdict("---\n\n---\n# No verdict"), undefined, "empty frontmatter → undefined");
+    assert.equal(extractVerdict("---\nverdict:\n---"), undefined, "verdict with no value → undefined");
+    assert.equal(
+      extractVerdict("random text without frontmatter"),
+      undefined,
+      "no frontmatter → undefined",
+    );
+  });
+
+  test("VALIDATION with binary/garbage content: isValidationTerminal returns false", () => {
+    assert.equal(isValidationTerminal(""), false, "empty → not terminal");
+    assert.equal(isValidationTerminal("\x00\xFF\xFE"), false, "binary → not terminal");
+    assert.equal(
+      isValidationTerminal("---\ngarbage: yes\n---\nNo verdict here."),
+      false,
+      "no verdict field → not terminal",
+    );
+  });
+});
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 2: Transition Boundary Failures
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("transition boundary failures", () => {
+  let base: string;
+
+  afterEach(() => {
+    try { closeDatabase(); } catch { /* may not be open */ }
+    if (base) rmSync(base, { recursive: true, force: true });
+  });
+
+  test("mid-transition: CONTEXT.md created between derives transitions needs-discussion → pre-planning correctly", async () => {
+    base = makeTempDir();
+    const mDir = join(base, ".gsd", "milestones", "M001");
+    mkdirSync(mDir, { recursive: true });
+
+    // Start with only CONTEXT-DRAFT → needs-discussion
+    writeFileSync(join(mDir, "M001-CONTEXT-DRAFT.md"), "# Draft\nSome draft.\n");
+
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    invalidateAllCaches();
+    const state1 = await deriveState(base);
+    assert.equal(state1.phase, "needs-discussion");
+
+    // Now write the full CONTEXT (simulates discussion completion)
+    writeFileSync(join(mDir, "M001-CONTEXT.md"), "# M001: Resolved\n\n## Purpose\nDone.\n");
+
+    invalidateAllCaches();
+    const state2 = await deriveState(base);
+    // Should advance to pre-planning (has context but no roadmap yet)
+    assert.equal(state2.phase, "pre-planning");
+  });
+
+  test("cascading slice dependencies: S02 depends S01, S03 depends S02 — only S01 eligible", async () => {
+    base = makeTempDir();
+    const mDir = join(base, ".gsd", "milestones", "M001");
+
+    // Create 3 slices with chain deps
+    for (const sid of ["S01", "S02", "S03"]) {
+      const sDir = join(mDir, "slices", sid, "tasks");
+      mkdirSync(sDir, { recursive: true });
+      writeFileSync(
+        join(mDir, "slices", sid, `${sid}-PLAN.md`),
+        [
+          `# ${sid}: Feature`,
+          "",
+          "**Goal:** Do the thing.",
+          "",
+          "## Tasks",
+          "",
+          "- [ ] **T01: Task** `est:30m`",
+          "  - Do: Implement",
+          "  - Verify: Run tests",
+        ].join("\n"),
+      );
+      writeFileSync(join(sDir, "T01-PLAN.md"), "# T01 Plan\nDo it.\n");
+    }
+
+    writeFileSync(join(mDir, "M001-CONTEXT.md"), "# M001: Chain\n\n## Purpose\nTest deps.\n");
+    writeFileSync(
+      join(mDir, "M001-ROADMAP.md"),
+      [
+        "# M001: Chain Deps",
+        "",
+        "## Vision",
+        "Test cascading.",
+        "",
+        "## Success Criteria",
+        "- Works",
+        "",
+        "## Slices",
+        "",
+        "- [ ] **S01: Base** `risk:low` `depends:[]`",
+        "  - After this: Base done.",
+        "",
+        "- [ ] **S02: Middle** `risk:low` `depends:[S01]`",
+        "  - After this: Middle done.",
+        "",
+        "- [ ] **S03: Top** `risk:low` `depends:[S02]`",
+        "  - After this: Top done.",
+        "",
+        "## Boundary Map",
+        "",
+        "| From | To | Produces | Consumes |",
+        "|------|----|----------|----------|",
+        "| S01 | S02 | base | nothing |",
+        "| S02 | S03 | middle | base |",
+        "| S03 | terminal | top | middle |",
+      ].join("\n"),
+    );
+
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Chain", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "Base", status: "pending", depends: [] });
+    insertSlice({ id: "S02", milestoneId: "M001", title: "Middle", status: "pending", depends: ["S01"] });
+    insertSlice({ id: "S03", milestoneId: "M001", title: "Top", status: "pending", depends: ["S02"] });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "pending" });
+    insertTask({ id: "T01", sliceId: "S02", milestoneId: "M001", status: "pending" });
+    insertTask({ id: "T01", sliceId: "S03", milestoneId: "M001", status: "pending" });
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+
+    // Only S01 should be active — S02 and S03 are dep-blocked
+    assert.equal(state.activeSlice?.id, "S01", "S01 should be the active slice (no deps)");
+    assert.equal(state.phase, "executing", "should be executing S01");
+  });
+
+  test("cascading deps: completing S01 unblocks S02 (not S03)", async () => {
+    base = makeTempDir();
+    const mDir = join(base, ".gsd", "milestones", "M001");
+    for (const sid of ["S01", "S02", "S03"]) {
+      const sDir = join(mDir, "slices", sid, "tasks");
+      mkdirSync(sDir, { recursive: true });
+      writeFileSync(
+        join(mDir, "slices", sid, `${sid}-PLAN.md`),
+        `# ${sid}\n\n**Goal:** Do.\n\n## Tasks\n\n- [ ] **T01: Task** \`est:30m\`\n  - Do: Impl\n  - Verify: Test\n`,
+      );
+      writeFileSync(join(sDir, "T01-PLAN.md"), `# T01 Plan\nDo it.\n`);
+    }
+    // Write slice SUMMARY for S01
+    writeFileSync(
+      join(mDir, "slices", "S01", "S01-SUMMARY.md"),
+      "---\n---\n# S01 Summary\nDone.\n",
+    );
+
+    writeFileSync(join(mDir, "M001-CONTEXT.md"), "# M001: Chain\n\n## Purpose\nTest.\n");
+    writeFileSync(
+      join(mDir, "M001-ROADMAP.md"),
+      [
+        "# M001: Chain",
+        "",
+        "## Vision",
+        "Test.",
+        "",
+        "## Success Criteria",
+        "- Works",
+        "",
+        "## Slices",
+        "",
+        "- [x] **S01: Base** `risk:low` `depends:[]`",
+        "  - After this: Done.",
+        "",
+        "- [ ] **S02: Middle** `risk:low` `depends:[S01]`",
+        "  - After this: Done.",
+        "",
+        "- [ ] **S03: Top** `risk:low` `depends:[S02]`",
+        "  - After this: Done.",
+        "",
+        "## Boundary Map",
+        "",
+        "| From | To | Produces | Consumes |",
+        "|------|----|----------|----------|",
+        "| S01 | S02 | x | nothing |",
+        "| S02 | S03 | y | x |",
+        "| S03 | terminal | z | y |",
+      ].join("\n"),
+    );
+
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Chain", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "Base", status: "complete", depends: [] });
+    insertSlice({ id: "S02", milestoneId: "M001", title: "Middle", status: "pending", depends: ["S01"] });
+    insertSlice({ id: "S03", milestoneId: "M001", title: "Top", status: "pending", depends: ["S02"] });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "complete" });
+    insertTask({ id: "T01", sliceId: "S02", milestoneId: "M001", status: "pending" });
+    insertTask({ id: "T01", sliceId: "S03", milestoneId: "M001", status: "pending" });
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+
+    // S01 complete → S02 unblocked → S02 should be active
+    assert.equal(state.activeSlice?.id, "S02", "S02 should be active after S01 completes");
+    assert.equal(state.phase, "executing");
+  });
+
+  test("multi-milestone deps: M002 depends M001, M003 depends M002 — blocked correctly", async () => {
+    base = createMultiMilestoneFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "First", status: "active" });
+    insertMilestone({ id: "M002", title: "Second", status: "active", depends_on: ["M001"] });
+    insertMilestone({ id: "M003", title: "Third", status: "active", depends_on: ["M002"] });
+
+    insertSlice({ id: "S01", milestoneId: "M001", title: "S01", status: "pending" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "pending" });
+    insertSlice({ id: "S01", milestoneId: "M002", title: "S01", status: "pending" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M002", status: "pending" });
+    insertSlice({ id: "S01", milestoneId: "M003", title: "S01", status: "pending" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M003", status: "pending" });
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+
+    // Only M001 should be active — M002 and M003 are blocked
+    assert.equal(state.activeMilestone?.id, "M001", "M001 should be active (no deps)");
+  });
+
+  test("blocker_discovered in task transitions to replanning-slice", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "First", status: "in_progress" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "complete", blockerDiscovered: true });
+    insertTask({ id: "T02", sliceId: "S01", milestoneId: "M001", status: "pending" });
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+    assert.equal(state.phase, "replanning-slice", "blocker_discovered should trigger replanning");
+    assert.ok(state.blockers.length > 0, "should report blocker");
+  });
+
+  test("replan loop protection: replan already done skips replanning-slice", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "First", status: "in_progress" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "complete", blockerDiscovered: true });
+    insertTask({ id: "T02", sliceId: "S01", milestoneId: "M001", status: "pending" });
+
+    // Record that a replan was already done for this slice
+    insertReplanHistory({
+      milestoneId: "M001",
+      sliceId: "S01",
+      summary: "Already replanned once",
+    });
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+    // With replan history, should NOT re-enter replanning-slice
+    assert.notEqual(
+      state.phase,
+      "replanning-slice",
+      "replan loop protection: should not re-enter replanning after replan was done",
+    );
+  });
+
+  test("blocked state: all slices have unmet deps → blocked phase", async () => {
+    base = makeTempDir();
+    const mDir = join(base, ".gsd", "milestones", "M001");
+    mkdirSync(join(mDir, "slices", "S01", "tasks"), { recursive: true });
+    mkdirSync(join(mDir, "slices", "S02", "tasks"), { recursive: true });
+
+    writeFileSync(join(mDir, "M001-CONTEXT.md"), "# M001\n\n## Purpose\nTest.\n");
+    writeFileSync(
+      join(mDir, "M001-ROADMAP.md"),
+      [
+        "# M001: Blocked",
+        "",
+        "## Vision",
+        "Test blocked.",
+        "",
+        "## Success Criteria",
+        "- Works",
+        "",
+        "## Slices",
+        "",
+        "- [ ] **S01: A** `risk:low` `depends:[S02]`",
+        "  - After this: Done.",
+        "",
+        "- [ ] **S02: B** `risk:low` `depends:[S01]`",
+        "  - After this: Done.",
+        "",
+        "## Boundary Map",
+        "",
+        "| From | To | Produces | Consumes |",
+        "|------|----|----------|----------|",
+        "| S01 | S02 | a | b |",
+        "| S02 | S01 | b | a |",
+      ].join("\n"),
+    );
+
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Blocked", status: "active" });
+    // Circular deps: S01→S02 and S02→S01 — both blocked
+    insertSlice({ id: "S01", milestoneId: "M001", title: "A", status: "pending", depends: ["S02"] });
+    insertSlice({ id: "S02", milestoneId: "M001", title: "B", status: "pending", depends: ["S01"] });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "pending" });
+    insertTask({ id: "T01", sliceId: "S02", milestoneId: "M001", status: "pending" });
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+    assert.equal(state.phase, "blocked", "circular deps should produce blocked phase");
+  });
+});
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 3: Dispatch Failure Modes
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("dispatch failure modes", () => {
+  let base: string;
+
+  afterEach(() => {
+    try { closeDatabase(); } catch { /* may not be open */ }
+    if (base) rmSync(base, { recursive: true, force: true });
+  });
+
+  test("dispatch with null activeSlice in executing phase → stop (error)", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+
+    const ctx = buildDispatchCtx(base, "M001", {
+      phase: "executing",
+      activeSlice: null,
+      activeTask: { id: "T01", title: "Task" },
+    });
+
+    // The "executing → execute-task (recover missing task plan)" rule checks activeSlice
+    // and returns missingSliceStop when null
+    const result = await resolveDispatch(ctx);
+    assert.equal(result.action, "stop", "null activeSlice in executing should stop");
+  });
+
+  test("dispatch for unhandled phase → stop with diagnostic", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+
+    const ctx = buildDispatchCtx(base, "M001", {
+      phase: "paused" as any,
+      activeSlice: null,
+      activeTask: null,
+    });
+
+    const result = await resolveDispatch(ctx);
+    assert.equal(result.action, "stop", "unhandled phase should produce stop action");
+  });
+
+  test("dispatch: summarizing with null activeSlice → stop (error)", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+
+    const ctx = buildDispatchCtx(base, "M001", {
+      phase: "summarizing",
+      activeSlice: null,
+      activeTask: null,
+    });
+
+    const result = await resolveDispatch(ctx);
+    assert.equal(result.action, "stop", "summarizing without activeSlice should stop");
+    assert.ok(
+      (result as any).reason?.includes("no active slice"),
+      "stop reason should mention missing slice",
+    );
+  });
+
+  test("dispatch: evaluating-gates without gate config → skip (gates omitted)", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "First", status: "in_progress" });
+
+    const ctx = buildDispatchCtx(base, "M001", {
+      phase: "evaluating-gates",
+      activeSlice: { id: "S01", title: "First" },
+      activeTask: null,
+    });
+    ctx.prefs = undefined; // No prefs → gate_evaluation not enabled
+
+    const result = await resolveDispatch(ctx);
+    // Without gate config, the rule should skip (gates omitted)
+    assert.ok(
+      result.action === "skip" || result.action === "stop",
+      `evaluating-gates without config should skip or stop, got: ${result.action}`,
+    );
+  });
+
+  test("dispatch: needs-discussion → discuss-milestone dispatch", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+
+    const ctx = buildDispatchCtx(base, "M001", {
+      phase: "needs-discussion",
+      activeSlice: null,
+      activeTask: null,
+    });
+
+    const result = await resolveDispatch(ctx);
+    assert.equal(result.action, "dispatch");
+    assert.equal((result as any).unitType, "discuss-milestone");
+  });
+
+  test("dispatch: complete phase → stop with info level", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+
+    const ctx = buildDispatchCtx(base, "M001", {
+      phase: "complete",
+      activeSlice: null,
+      activeTask: null,
+    });
+
+    const result = await resolveDispatch(ctx);
+    assert.equal(result.action, "stop");
+    assert.equal((result as any).level, "info");
+    assert.ok((result as any).reason?.includes("complete"), "reason should mention completion");
+  });
+
+  test("dispatch rule order: first match wins for overlapping rules", () => {
+    const ruleNames = getDispatchRuleNames();
+    // Verify critical ordering constraints
+    const summarizeIdx = ruleNames.indexOf("summarizing → complete-slice");
+    const runUatIdx = ruleNames.indexOf("run-uat (post-completion)");
+    const uatGateIdx = ruleNames.indexOf("uat-verdict-gate (non-PASS blocks progression)");
+    const executeIdx = ruleNames.indexOf("executing → execute-task");
+
+    // summarizing should come before execute-task
+    assert.ok(summarizeIdx < executeIdx, "summarizing rule should precede execute-task");
+    // run-uat should come before uat-verdict-gate
+    assert.ok(runUatIdx < uatGateIdx, "run-uat should precede uat-verdict-gate");
+  });
+});
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 4: Completion & Verification Failures
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("completion and verification failures", () => {
+  let base: string;
+
+  afterEach(() => {
+    try { closeDatabase(); } catch { /* may not be open */ }
+    if (base) rmSync(base, { recursive: true, force: true });
+  });
+
+  test("needs-remediation VALIDATION blocks milestone completion dispatch", async () => {
+    base = createFullFixture();
+    const mDir = join(base, ".gsd", "milestones", "M001");
+    writeFileSync(
+      join(mDir, "M001-VALIDATION.md"),
+      [
+        "---",
+        "verdict: needs-remediation",
+        "remediation_round: 1",
+        "---",
+        "",
+        "# Validation",
+        "",
+        "Needs remediation work.",
+      ].join("\n"),
+    );
+
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "First", status: "complete" });
+    insertSlice({ id: "S02", milestoneId: "M001", title: "Second", status: "complete" });
+
+    const ctx = buildDispatchCtx(base, "M001", {
+      phase: "completing-milestone",
+      activeSlice: null,
+      activeTask: null,
+    });
+
+    const result = await resolveDispatch(ctx);
+    assert.equal(result.action, "stop", "needs-remediation should block completion");
+    assert.ok(
+      (result as any).reason?.includes("needs-remediation"),
+      "stop reason should mention needs-remediation",
+    );
+  });
+
+  test("missing slice SUMMARY blocks milestone validation dispatch", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "First", status: "complete" });
+    insertSlice({ id: "S02", milestoneId: "M001", title: "Second", status: "complete" });
+    // No S01-SUMMARY.md or S02-SUMMARY.md on disk
+
+    const ctx = buildDispatchCtx(base, "M001", {
+      phase: "validating-milestone",
+      activeSlice: null,
+      activeTask: null,
+    });
+
+    const result = await resolveDispatch(ctx);
+    assert.equal(result.action, "stop", "missing SUMMARY files should block validation");
+    assert.ok(
+      (result as any).reason?.includes("missing SUMMARY"),
+      "stop reason should mention missing SUMMARY",
+    );
+  });
+
+  test("VALIDATION with pass verdict: isValidationTerminal returns true", () => {
+    const content = "---\nverdict: pass\nremediation_round: 0\n---\n# Pass\n";
+    assert.equal(isValidationTerminal(content), true);
+  });
+
+  test("VALIDATION with needs-attention: isValidationTerminal returns true", () => {
+    const content = "---\nverdict: needs-attention\n---\n# Attention\n";
+    assert.equal(isValidationTerminal(content), true);
+  });
+
+  test("VALIDATION with needs-remediation: isValidationTerminal returns true (terminal for loop prevention)", () => {
+    // Per #832: needs-remediation IS terminal to prevent validate-milestone loops
+    const content = "---\nverdict: needs-remediation\nremediation_round: 1\n---\n# Remediate\n";
+    assert.equal(isValidationTerminal(content), true);
+  });
+
+  test("UAT verdict gate: non-PASS verdict blocks progression", () => {
+    assert.equal(isAcceptableUatVerdict("pass", undefined), true);
+    assert.equal(isAcceptableUatVerdict("passed", undefined), true);
+    assert.equal(isAcceptableUatVerdict("fail", undefined), false);
+    assert.equal(isAcceptableUatVerdict("needs-remediation", undefined), false);
+    assert.equal(isAcceptableUatVerdict("partial", undefined), false, "partial without eligible type → not acceptable");
+    assert.equal(isAcceptableUatVerdict("partial", "mixed"), true, "partial with mixed type → acceptable");
+    assert.equal(isAcceptableUatVerdict("partial", "human-experience"), true, "partial with human-experience → acceptable");
+    assert.equal(isAcceptableUatVerdict("partial", "artifact-driven"), false, "partial with artifact-driven → not acceptable");
+  });
+
+  test("milestone validation verdict schema validation", () => {
+    assert.equal(isValidMilestoneVerdict("pass"), true);
+    assert.equal(isValidMilestoneVerdict("needs-attention"), true);
+    assert.equal(isValidMilestoneVerdict("needs-remediation"), true);
+    assert.equal(isValidMilestoneVerdict("fail"), false, "fail is not a valid milestone verdict");
+    assert.equal(isValidMilestoneVerdict(""), false);
+    assert.equal(isValidMilestoneVerdict("unknown"), false);
+  });
+
+  test("all slices done + no VALIDATION → validating-milestone (not completing)", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "First", status: "complete" });
+    insertSlice({ id: "S02", milestoneId: "M001", title: "Second", status: "complete" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "complete" });
+    insertTask({ id: "T02", sliceId: "S01", milestoneId: "M001", status: "complete" });
+    insertTask({ id: "T01", sliceId: "S02", milestoneId: "M001", status: "complete" });
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+    assert.equal(
+      state.phase,
+      "validating-milestone",
+      "all slices done without VALIDATION should be validating-milestone",
+    );
+  });
+
+  test("all slices done + terminal VALIDATION + no SUMMARY → completing-milestone", async () => {
+    base = createFullFixture();
+    writeFileSync(
+      join(base, ".gsd", "milestones", "M001", "M001-VALIDATION.md"),
+      "---\nverdict: pass\n---\n# Validation\nPassed.\n",
+    );
+
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "First", status: "complete" });
+    insertSlice({ id: "S02", milestoneId: "M001", title: "Second", status: "complete" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "complete" });
+    insertTask({ id: "T02", sliceId: "S01", milestoneId: "M001", status: "complete" });
+    insertTask({ id: "T01", sliceId: "S02", milestoneId: "M001", status: "complete" });
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+    assert.equal(
+      state.phase,
+      "completing-milestone",
+      "terminal VALIDATION without SUMMARY should be completing-milestone",
+    );
+  });
+
+  test("extractVerdict: markdown body fallback works", () => {
+    // When LLM writes verdict in body instead of frontmatter (#2960)
+    assert.equal(extractVerdict("# Validation\n\n**Verdict:** PASS"), "pass");
+    assert.equal(extractVerdict("# Validation\n\n**Verdict:** ✅ PASS"), "pass");
+    assert.equal(extractVerdict("# Validation\n\n**Verdict** needs-remediation"), "needs-remediation");
+  });
+
+  test("extractVerdict: normalizes 'passed' to 'pass'", () => {
+    assert.equal(extractVerdict("---\nverdict: passed\n---"), "pass");
+    assert.equal(extractVerdict("**Verdict:** passed"), "pass");
+  });
+
+  test("isClosedStatus: boundary values", () => {
+    assert.equal(isClosedStatus("complete"), true);
+    assert.equal(isClosedStatus("done"), true);
+    assert.equal(isClosedStatus("skipped"), true);
+    assert.equal(isClosedStatus("active"), false);
+    assert.equal(isClosedStatus("pending"), false);
+    assert.equal(isClosedStatus("in_progress"), false);
+    assert.equal(isClosedStatus(""), false);
+    assert.equal(isClosedStatus("COMPLETE"), false, "case-sensitive: uppercase should be false");
+  });
+});
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 5: Ghost Milestone Edge Cases
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("ghost milestone edge cases", () => {
+  let base: string;
+
+  afterEach(() => {
+    try { closeDatabase(); } catch { /* may not be open */ }
+    if (base) rmSync(base, { recursive: true, force: true });
+  });
+
+  test("empty directory with DB row is NOT a ghost (#2921)", () => {
+    base = makeTempDir();
+    const mDir = join(base, ".gsd", "milestones", "M001");
+    mkdirSync(mDir, { recursive: true });
+
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Queued", status: "active" });
+
+    assert.equal(isGhostMilestone(base, "M001"), false, "DB row means not a ghost");
+  });
+
+  test("empty directory with worktree is NOT a ghost (#2921)", () => {
+    base = makeTempDir();
+    const mDir = join(base, ".gsd", "milestones", "M001");
+    mkdirSync(mDir, { recursive: true });
+    // Simulate worktree existence
+    mkdirSync(join(base, ".gsd", "worktrees", "M001"), { recursive: true });
+
+    assert.equal(isGhostMilestone(base, "M001"), false, "worktree means not a ghost");
+  });
+
+  test("empty directory without DB or worktree IS a ghost", () => {
+    base = makeTempDir();
+    const mDir = join(base, ".gsd", "milestones", "M001");
+    mkdirSync(mDir, { recursive: true });
+
+    assert.equal(isGhostMilestone(base, "M001"), true, "no DB, no worktree, no files → ghost");
+  });
+
+  test("directory with only META.json is still a ghost", () => {
+    base = makeTempDir();
+    const mDir = join(base, ".gsd", "milestones", "M001");
+    mkdirSync(mDir, { recursive: true });
+    writeFileSync(join(mDir, "META.json"), '{"created":"2026-01-01"}');
+
+    assert.equal(isGhostMilestone(base, "M001"), true, "META.json alone → ghost");
+  });
+
+  test("ghost milestones are skipped in state derivation", async () => {
+    base = makeTempDir();
+    const gsdDir = join(base, ".gsd", "milestones");
+
+    // M001 is ghost — empty dir
+    mkdirSync(join(gsdDir, "M001"), { recursive: true });
+
+    // M002 is real — has CONTEXT-DRAFT
+    mkdirSync(join(gsdDir, "M002"), { recursive: true });
+    writeFileSync(join(gsdDir, "M002", "M002-CONTEXT-DRAFT.md"), "# Draft\nContent.\n");
+
+    invalidateAllCaches();
+    const state = await deriveState(base);
+    assert.equal(state.activeMilestone?.id, "M002", "ghost M001 skipped, M002 is active");
+  });
+});
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 6: Dispatch Guard Integration
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("dispatch guard integration", () => {
+  let base: string;
+
+  afterEach(() => {
+    try { closeDatabase(); } catch { /* may not be open */ }
+    if (base) rmSync(base, { recursive: true, force: true });
+  });
+
+  test("skip_milestone_validation preference writes pass-through VALIDATION", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "First", status: "complete" });
+    insertSlice({ id: "S02", milestoneId: "M001", title: "Second", status: "complete" });
+    // Write slice SUMMARYs so the missing SUMMARY guard doesn't fire
+    writeFileSync(
+      join(base, ".gsd", "milestones", "M001", "slices", "S01", "S01-SUMMARY.md"),
+      "# S01 Summary\nDone.\n",
+    );
+    writeFileSync(
+      join(base, ".gsd", "milestones", "M001", "slices", "S02", "S02-SUMMARY.md"),
+      "# S02 Summary\nDone.\n",
+    );
+
+    const ctx = buildDispatchCtx(base, "M001", {
+      phase: "validating-milestone",
+      activeSlice: null,
+      activeTask: null,
+    });
+    ctx.prefs = { phases: { skip_milestone_validation: true } } as any;
+
+    const result = await resolveDispatch(ctx);
+    assert.equal(result.action, "skip", "skip_milestone_validation should produce skip action");
+
+    // Should have written a pass-through VALIDATION file
+    const validationPath = join(base, ".gsd", "milestones", "M001", "M001-VALIDATION.md");
+    assert.ok(existsSync(validationPath), "VALIDATION file should be written");
+    const content = readFileSync(validationPath, "utf-8");
+    assert.ok(content.includes("verdict: pass"), "should contain pass verdict");
+    assert.ok(content.includes("skipped by preference"), "should note it was skipped");
+  });
+
+  test("rewrite-docs circuit breaker: exceeding MAX attempts resolves all overrides", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+
+    // Write a rewrite count at the max
+    const runtimeDir = join(base, ".gsd", "runtime");
+    mkdirSync(runtimeDir, { recursive: true });
+    writeFileSync(
+      join(runtimeDir, "rewrite-count.json"),
+      JSON.stringify({ count: 3, updatedAt: new Date().toISOString() }),
+    );
+
+    // Import and check
+    const { getRewriteCount } = await import("../../auto-dispatch.ts");
+    assert.equal(getRewriteCount(base), 3, "rewrite count should be 3");
+  });
+
+  test("replanning-slice with null activeSlice → stop (error)", async () => {
+    base = createFullFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+
+    const ctx = buildDispatchCtx(base, "M001", {
+      phase: "replanning-slice",
+      activeSlice: null,
+      activeTask: null,
+    });
+
+    const result = await resolveDispatch(ctx);
+    assert.equal(result.action, "stop", "replanning without activeSlice should stop");
+  });
+});
diff --git a/src/resources/extensions/gsd/tests/integration/state-machine-runtime-failures.test.ts b/src/resources/extensions/gsd/tests/integration/state-machine-runtime-failures.test.ts
new file mode 100644
index 000000000..1c0eadf49
--- /dev/null
+++ b/src/resources/extensions/gsd/tests/integration/state-machine-runtime-failures.test.ts
@@ -0,0 +1,841 @@
+/**
+ * state-machine-runtime-failures.test.ts — Tests for auto-loop runtime failures,
+ * infrastructure errors, stuck detection, session management, merge conflicts,
+ * concurrent access, and race conditions.
+ *
+ * These tests use mocked LoopDeps and AutoSession to exercise the auto-loop
+ * error handling paths without requiring real LLM sessions or network access.
+ *
+ * Coverage gaps filled:
+ * 1. Infrastructure error detection and immediate stop (ENOSPC, ENOMEM, etc.)
+ * 2. Consecutive error graduated recovery (1st → retry, 2nd → cache flush, 3rd → stop)
+ * 3. Stuck detection: same error repeated, same unit 3x, oscillation A↔B
+ * 4. Session lock validation: compromised, pid-mismatch, missing-metadata
+ * 5. Session creation timeout (NEW_SESSION_TIMEOUT_MS = 30s)
+ * 6. MergeConflictError stops auto-loop
+ * 7. Max iteration safety valve
+ * 8. s.active race: pause signal during unit execution
+ * 9. Filesystem mutation during dispatch cycle
+ * 10. Worktree disappearance detection
+ */
+
+// GSD State Machine Runtime Failure Tests
+
+import { describe, test, beforeEach, afterEach } from "node:test";
+import assert from "node:assert/strict";
+import {
+  mkdtempSync,
+  mkdirSync,
+  writeFileSync,
+  rmSync,
+  existsSync,
+  unlinkSync,
+} from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+
+// ── Infrastructure error detection ───────────────────────────────────────
+import {
+  isInfrastructureError,
+  INFRA_ERROR_CODES,
+} from "../../auto/infra-errors.ts";
+
+// ── Stuck detection ──────────────────────────────────────────────────────
+import { detectStuck } from "../../auto/detect-stuck.ts";
+import type { WindowEntry } from "../../auto/types.ts";
+
+// ── Session constants ────────────────────────────────────────────────────
+import {
+  AutoSession,
+  NEW_SESSION_TIMEOUT_MS,
+  MAX_UNIT_DISPATCHES,
+  STUB_RECOVERY_THRESHOLD,
+  MAX_LIFETIME_DISPATCHES,
+} from "../../auto/session.ts";
+
+// ── Auto-loop types ──────────────────────────────────────────────────────
+import { MAX_LOOP_ITERATIONS } from "../../auto/types.ts";
+
+// ── MergeConflictError ───────────────────────────────────────────────────
+import { MergeConflictError } from "../../git-service.ts";
+
+// ── Session lock ─────────────────────────────────────────────────────────
+import type { SessionLockStatus } from "../../session-lock.ts";
+
+// ── State & DB ───────────────────────────────────────────────────────────
+import {
+  openDatabase,
+  closeDatabase,
+  insertMilestone,
+  insertSlice,
+  insertTask,
+} from "../../gsd-db.ts";
+import {
+  deriveState,
+  deriveStateFromDb,
+  invalidateStateCache,
+  isGhostMilestone,
+} from "../../state.ts";
+import { invalidateAllCaches } from "../../cache.ts";
+
+// ═══════════════════════════════════════════════════════════════════════════
+// Fixture Helpers
+// ═══════════════════════════════════════════════════════════════════════════
+
+function makeTempDir(): string {
+  return mkdtempSync(join(tmpdir(), "gsd-runtime-fail-"));
+}
+
+function createMinimalFixture(): string {
+  const base = makeTempDir();
+  const mDir = join(base, ".gsd", "milestones", "M001", "slices", "S01", "tasks");
+  mkdirSync(mDir, { recursive: true });
+  writeFileSync(
+    join(base, ".gsd", "milestones", "M001", "M001-CONTEXT.md"),
+    "# M001: Runtime Test\n\n## Purpose\nTest runtime failures.\n",
+  );
+  writeFileSync(
+    join(base, ".gsd", "milestones", "M001", "M001-ROADMAP.md"),
+    [
+      "# M001: Runtime Test",
+      "",
+      "## Vision",
+      "Test.",
+      "",
+      "## Success Criteria",
+      "- Works",
+      "",
+      "## Slices",
+      "",
+      "- [ ] **S01: Feature** `risk:low` `depends:[]`",
+      "  - After this: Done.",
+      "",
+      "## Boundary Map",
+      "",
+      "| From | To | Produces | Consumes |",
+      "|------|----|----------|----------|",
+      "| S01 | terminal | out | nothing |",
+    ].join("\n"),
+  );
+  writeFileSync(
+    join(base, ".gsd", "milestones", "M001", "slices", "S01", "S01-PLAN.md"),
+    [
+      "# S01: Feature",
+      "",
+      "**Goal:** Build.",
+      "",
+      "## Tasks",
+      "",
+      "- [ ] **T01: Build** `est:30m`",
+      "  - Do: Build it",
+      "  - Verify: Test it",
+    ].join("\n"),
+  );
+  writeFileSync(
+    join(mDir, "T01-PLAN.md"),
+    "# T01 Plan\nBuild it.\n",
+  );
+  return base;
+}
+
+// ═══════════════════════════════════════════════════════════════════════════
+// Test Suite
+// ═══════════════════════════════════════════════════════════════════════════
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 1: Infrastructure Error Detection
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("infrastructure error detection", () => {
+  test("ENOSPC (disk full) is detected as infrastructure error", () => {
+    const err = Object.assign(new Error("write ENOSPC"), { code: "ENOSPC" });
+    assert.equal(isInfrastructureError(err), "ENOSPC");
+  });
+
+  test("ENOMEM (out of memory) is detected", () => {
+    const err = Object.assign(new Error("Cannot allocate memory"), { code: "ENOMEM" });
+    assert.equal(isInfrastructureError(err), "ENOMEM");
+  });
+
+  test("EROFS (read-only filesystem) is detected", () => {
+    const err = Object.assign(new Error("Read-only file system"), { code: "EROFS" });
+    assert.equal(isInfrastructureError(err), "EROFS");
+  });
+
+  test("EDQUOT (disk quota exceeded) is detected", () => {
+    const err = Object.assign(new Error("Disk quota exceeded"), { code: "EDQUOT" });
+    assert.equal(isInfrastructureError(err), "EDQUOT");
+  });
+
+  test("EMFILE (too many open files - process) is detected", () => {
+    const err = Object.assign(new Error("too many open files"), { code: "EMFILE" });
+    assert.equal(isInfrastructureError(err), "EMFILE");
+  });
+
+  test("ENFILE (too many open files - system) is detected", () => {
+    const err = Object.assign(new Error("file table overflow"), { code: "ENFILE" });
+    assert.equal(isInfrastructureError(err), "ENFILE");
+  });
+
+  test("ECONNREFUSED (connection refused) is detected", () => {
+    const err = Object.assign(new Error("Connection refused"), { code: "ECONNREFUSED" });
+    assert.equal(isInfrastructureError(err), "ECONNREFUSED");
+  });
+
+  test("ENOTFOUND (DNS lookup failed) is detected", () => {
+    const err = Object.assign(new Error("getaddrinfo ENOTFOUND api.anthropic.com"), { code: "ENOTFOUND" });
+    assert.equal(isInfrastructureError(err), "ENOTFOUND");
+  });
+
+  test("ENETUNREACH (network unreachable) is detected", () => {
+    const err = Object.assign(new Error("network is unreachable"), { code: "ENETUNREACH" });
+    assert.equal(isInfrastructureError(err), "ENETUNREACH");
+  });
+
+  test("EAGAIN (resource temporarily unavailable) is detected", () => {
+    const err = Object.assign(new Error("resource temporarily unavailable"), { code: "EAGAIN" });
+    assert.equal(isInfrastructureError(err), "EAGAIN");
+  });
+
+  test("SQLite WAL corruption is detected via message scan", () => {
+    const err = new Error("database disk image is malformed");
+    assert.equal(isInfrastructureError(err), "SQLITE_CORRUPT");
+  });
+
+  test("code-based detection when code property is present", () => {
+    const err = { code: "ENOSPC", message: "something" };
+    assert.equal(isInfrastructureError(err), "ENOSPC");
+  });
+
+  test("message fallback when no code property (e.g. string errors)", () => {
+    const err = new Error("write failed: ENOSPC: no space left on device");
+    assert.equal(isInfrastructureError(err), "ENOSPC");
+  });
+
+  test("non-infrastructure error returns null", () => {
+    assert.equal(isInfrastructureError(new Error("TypeError: x is not a function")), null);
+    assert.equal(isInfrastructureError(new Error("SyntaxError: Unexpected token")), null);
+    assert.equal(isInfrastructureError(new Error("rate_limit_exceeded")), null);
+    assert.equal(isInfrastructureError("just a string error"), null);
+    assert.equal(isInfrastructureError(null), null);
+    assert.equal(isInfrastructureError(undefined), null);
+    assert.equal(isInfrastructureError(42), null);
+  });
+
+  test("all INFRA_ERROR_CODES are covered", () => {
+    const expectedCodes = [
+      "ENOSPC", "ENOMEM", "EROFS", "EDQUOT", "EMFILE",
+      "ENFILE", "EAGAIN", "ECONNREFUSED", "ENOTFOUND", "ENETUNREACH",
+    ];
+    for (const code of expectedCodes) {
+      assert.ok(INFRA_ERROR_CODES.has(code), `${code} should be in INFRA_ERROR_CODES`);
+    }
+    assert.equal(INFRA_ERROR_CODES.size, expectedCodes.length, "no unexpected codes");
+  });
+});
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 2: Stuck Detection
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("stuck detection", () => {
+  test("Rule 1: same error repeated consecutively → stuck", () => {
+    const window: WindowEntry[] = [
+      { key: "M001/S01/T01", error: "Provider returned 500" },
+      { key: "M001/S01/T01", error: "Provider returned 500" },
+    ];
+    const result = detectStuck(window);
+    assert.ok(result?.stuck, "same error twice should be stuck");
+    assert.ok(result?.reason.includes("Same error repeated"), "reason should mention error");
+  });
+
+  test("Rule 1: different errors are NOT stuck", () => {
+    const window: WindowEntry[] = [
+      { key: "M001/S01/T01", error: "Provider returned 500" },
+      { key: "M001/S01/T01", error: "Provider returned 429" },
+    ];
+    const result = detectStuck(window);
+    // Different errors → not stuck by Rule 1 (but might be by Rule 2 with more entries)
+    assert.equal(result, null, "different errors should not trigger Rule 1");
+  });
+
+  test("Rule 2: same unit 3 consecutive times → stuck", () => {
+    const window: WindowEntry[] = [
+      { key: "M001/S01/T01" },
+      { key: "M001/S01/T01" },
+      { key: "M001/S01/T01" },
+    ];
+    const result = detectStuck(window);
+    assert.ok(result?.stuck, "same unit 3x should be stuck");
+    assert.ok(result?.reason.includes("3 consecutive times"), "reason should mention 3x");
+  });
+
+  test("Rule 2: 2 consecutive same units is NOT stuck", () => {
+    const window: WindowEntry[] = [
+      { key: "M001/S01/T01" },
+      { key: "M001/S01/T01" },
+    ];
+    const result = detectStuck(window);
+    assert.equal(result, null, "2x same unit is not stuck");
+  });
+
+  test("Rule 3: oscillation A→B→A→B → stuck", () => {
+    const window: WindowEntry[] = [
+      { key: "M001/S01/T01" },
+      { key: "M001/S01/T02" },
+      { key: "M001/S01/T01" },
+      { key: "M001/S01/T02" },
+    ];
+    const result = detectStuck(window);
+    assert.ok(result?.stuck, "A→B→A→B should be stuck");
+    assert.ok(result?.reason.includes("Oscillation"), "reason should mention oscillation");
+  });
+
+  test("Rule 3: A→B→C→D is NOT oscillation", () => {
+    const window: WindowEntry[] = [
+      { key: "A" },
+      { key: "B" },
+      { key: "C" },
+      { key: "D" },
+    ];
+    assert.equal(detectStuck(window), null, "sequential progress is not stuck");
+  });
+
+  test("empty window returns null", () => {
+    assert.equal(detectStuck([]), null);
+  });
+
+  test("single entry returns null", () => {
+    assert.equal(detectStuck([{ key: "A" }]), null);
+  });
+
+  test("Rule 1 takes precedence over Rule 2 when both apply", () => {
+    const window: WindowEntry[] = [
+      { key: "A", error: "fail" },
+      { key: "A", error: "fail" },
+      { key: "A", error: "fail" },
+    ];
+    const result = detectStuck(window);
+    assert.ok(result?.stuck);
+    // Rule 1 fires first (same error at indices 1,2)
+    assert.ok(result?.reason.includes("Same error repeated"));
+  });
+
+  test("errors on different keys are not stuck by Rule 1", () => {
+    const window: WindowEntry[] = [
+      { key: "A", error: "fail" },
+      { key: "B", error: "fail" },
+    ];
+    // Same error but different keys — Rule 1 compares errors regardless of key
+    const result = detectStuck(window);
+    // Rule 1 says "same error repeated consecutively" — it checks error strings
+    assert.ok(result?.stuck, "same error string on different keys still triggers Rule 1");
+  });
+});
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 3: Session Management
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("session management", () => {
+  test("AutoSession reset() clears all mutable state", () => {
+    const s = new AutoSession();
+    s.active = true;
+    s.paused = true;
+    s.basePath = "/tmp/test";
+    s.currentUnit = { type: "execute-task", id: "M001/S01/T01", startedAt: Date.now() };
+    s.currentMilestoneId = "M001";
+    s.unitDispatchCount.set("M001/S01/T01", 3);
+    s.unitLifetimeDispatches.set("M001/S01/T01", 5);
+    s.unitRecoveryCount.set("M001/S01/T01", 1);
+
+    s.reset();
+
+    assert.equal(s.active, false, "active should be false after reset");
+    assert.equal(s.paused, false, "paused should be false after reset");
+    assert.equal(s.currentUnit, null, "currentUnit should be null after reset");
+    assert.equal(s.currentMilestoneId, null, "currentMilestoneId should be null");
+    assert.equal(s.unitDispatchCount.size, 0, "dispatch counts cleared");
+    assert.equal(s.unitLifetimeDispatches.size, 0, "lifetime dispatches cleared");
+    assert.equal(s.unitRecoveryCount.size, 0, "recovery counts cleared");
+  });
+
+  test("NEW_SESSION_TIMEOUT_MS is 30 seconds", () => {
+    assert.equal(NEW_SESSION_TIMEOUT_MS, 30_000, "session timeout should be 30s");
+  });
+
+  test("MAX_UNIT_DISPATCHES limits retries for a single unit", () => {
+    assert.equal(MAX_UNIT_DISPATCHES, 3, "max unit dispatches should be 3");
+  });
+
+  test("MAX_LIFETIME_DISPATCHES is the absolute limit per unit", () => {
+    assert.equal(MAX_LIFETIME_DISPATCHES, 6, "max lifetime dispatches should be 6");
+  });
+
+  test("STUB_RECOVERY_THRESHOLD triggers recovery after N stub completions", () => {
+    assert.equal(STUB_RECOVERY_THRESHOLD, 2, "stub recovery threshold should be 2");
+  });
+
+  test("MAX_LOOP_ITERATIONS prevents runaway loops", () => {
+    assert.equal(MAX_LOOP_ITERATIONS, 500, "max iterations should be 500");
+  });
+
+  test("AutoSession dispatch counter tracks per-unit dispatches", () => {
+    const s = new AutoSession();
+    const unitId = "M001/S01/T01";
+
+    assert.equal(s.unitDispatchCount.get(unitId), undefined);
+
+    s.unitDispatchCount.set(unitId, 1);
+    assert.equal(s.unitDispatchCount.get(unitId), 1);
+
+    s.unitDispatchCount.set(unitId, 2);
+    assert.equal(s.unitDispatchCount.get(unitId), 2);
+
+    // Exceeding MAX_UNIT_DISPATCHES
+    s.unitDispatchCount.set(unitId, MAX_UNIT_DISPATCHES + 1);
+    assert.ok(
+      s.unitDispatchCount.get(unitId)! > MAX_UNIT_DISPATCHES,
+      "should track count beyond max for detection",
+    );
+  });
+
+  test("AutoSession toJSON() provides diagnostic snapshot", () => {
+    const s = new AutoSession();
+    s.active = true;
+    s.basePath = "/tmp/test";
+    s.currentUnit = { type: "execute-task", id: "M001/S01/T01", startedAt: Date.now() };
+
+    const json = s.toJSON();
+    assert.ok(json, "toJSON should return a value");
+    assert.equal(typeof json, "object", "toJSON should return an object");
+  });
+});
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 4: Session Lock Validation
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("session lock validation", () => {
+  test("SessionLockStatus: valid lock", () => {
+    const status: SessionLockStatus = { valid: true };
+    assert.equal(status.valid, true);
+    assert.equal(status.failureReason, undefined);
+  });
+
+  test("SessionLockStatus: compromised lock (sleep/wake cycle)", () => {
+    const status: SessionLockStatus = {
+      valid: false,
+      failureReason: "compromised",
+    };
+    assert.equal(status.valid, false);
+    assert.equal(status.failureReason, "compromised");
+  });
+
+  test("SessionLockStatus: pid-mismatch (another process took over)", () => {
+    const status: SessionLockStatus = {
+      valid: false,
+      failureReason: "pid-mismatch",
+      existingPid: 12345,
+      expectedPid: 67890,
+    };
+    assert.equal(status.valid, false);
+    assert.equal(status.failureReason, "pid-mismatch");
+    assert.notEqual(status.existingPid, status.expectedPid);
+  });
+
+  test("SessionLockStatus: missing-metadata", () => {
+    const status: SessionLockStatus = {
+      valid: false,
+      failureReason: "missing-metadata",
+    };
+    assert.equal(status.valid, false);
+    assert.equal(status.failureReason, "missing-metadata");
+  });
+});
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 5: MergeConflictError
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("MergeConflictError handling", () => {
+  test("MergeConflictError has correct properties", () => {
+    const err = new MergeConflictError(
+      ["src/feature.ts", "src/utils.ts"],
+      "squash",
+      "gsd/auto/M001",
+      "main",
+    );
+
+    assert.ok(err instanceof Error, "should be an Error");
+    assert.ok(err instanceof MergeConflictError, "should be a MergeConflictError");
+    assert.deepEqual(err.conflictedFiles, ["src/feature.ts", "src/utils.ts"]);
+    assert.equal(err.strategy, "squash");
+    assert.equal(err.branch, "gsd/auto/M001");
+    assert.equal(err.mainBranch, "main");
+  });
+
+  test("MergeConflictError with merge strategy", () => {
+    const err = new MergeConflictError(
+      ["package.json"],
+      "merge",
+      "feat/new-feature",
+      "main",
+    );
+    assert.equal(err.strategy, "merge");
+  });
+
+  test("MergeConflictError with empty conflict list", () => {
+    const err = new MergeConflictError([], "squash", "branch", "main");
+    assert.deepEqual(err.conflictedFiles, []);
+  });
+
+  test("MergeConflictError is distinguishable from generic errors", () => {
+    const mergeErr = new MergeConflictError(["file.ts"], "squash", "b", "m");
+    const genericErr = new Error("merge failed");
+
+    assert.ok(mergeErr instanceof MergeConflictError);
+    assert.ok(!(genericErr instanceof MergeConflictError));
+
+    // This is the exact pattern used in phases.ts catch blocks
+    if (mergeErr instanceof MergeConflictError) {
+      assert.ok(true, "instanceof check works for catch blocks");
+    }
+  });
+});
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 6: Filesystem Race Conditions
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("filesystem race conditions", () => {
+  let base: string;
+
+  afterEach(() => {
+    try { closeDatabase(); } catch { /* may not be open */ }
+    if (base) rmSync(base, { recursive: true, force: true });
+  });
+
+  test("ROADMAP deleted during derive cycle → graceful degradation", async () => {
+    base = createMinimalFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "Feature", status: "in_progress" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "pending" });
+
+    invalidateAllCaches();
+    const state1 = await deriveStateFromDb(base);
+    assert.equal(state1.phase, "executing");
+
+    // Delete ROADMAP mid-flow
+    const roadmapPath = join(base, ".gsd", "milestones", "M001", "M001-ROADMAP.md");
+    unlinkSync(roadmapPath);
+
+    invalidateAllCaches();
+    // DB still has the slice/task data, so derivation should still work
+    const state2 = await deriveStateFromDb(base);
+    assert.ok(state2.phase, "should produce a valid phase even after ROADMAP deletion");
+  });
+
+  test("CONTEXT deleted during derive → falls back gracefully", async () => {
+    base = createMinimalFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+
+    const contextPath = join(base, ".gsd", "milestones", "M001", "M001-CONTEXT.md");
+    unlinkSync(contextPath);
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+    // Without CONTEXT, title fallback should still work
+    assert.ok(state.activeMilestone, "should still have an active milestone from DB");
+  });
+
+  test("entire slice directory deleted → derive produces valid state", async () => {
+    base = createMinimalFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "Feature", status: "in_progress" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "pending" });
+
+    // Delete entire S01 directory
+    rmSync(join(base, ".gsd", "milestones", "M001", "slices", "S01"), { recursive: true, force: true });
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+    // DB still has slice/task rows, disk is gone — state should degrade gracefully
+    assert.ok(state.phase, "should produce valid phase after slice dir deletion");
+  });
+
+  test("task PLAN file deleted between dispatch and execution → recovery dispatch", async () => {
+    base = createMinimalFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "Feature", status: "in_progress" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "pending" });
+
+    // Delete T01-PLAN.md
+    const planPath = join(base, ".gsd", "milestones", "M001", "slices", "S01", "tasks", "T01-PLAN.md");
+    unlinkSync(planPath);
+
+    // Also write milestone RESEARCH so research-slice rule doesn't fire first
+    writeFileSync(
+      join(base, ".gsd", "milestones", "M001", "M001-RESEARCH.md"),
+      "# Research\nDone.\n",
+    );
+    // Write slice RESEARCH so research-slice rule for non-S01 doesn't fire
+    writeFileSync(
+      join(base, ".gsd", "milestones", "M001", "slices", "S01", "S01-RESEARCH.md"),
+      "# S01 Research\nDone.\n",
+    );
+
+    const { resolveDispatch } = await import("../../auto-dispatch.ts");
+
+    invalidateAllCaches();
+    const state = await deriveStateFromDb(base);
+
+    const ctx = {
+      basePath: base,
+      mid: "M001",
+      midTitle: "Active",
+      state,
+      prefs: undefined,
+    };
+
+    const result = await resolveDispatch(ctx);
+    // The "executing → execute-task (recover missing task plan)" rule should
+    // detect missing T01-PLAN.md and dispatch plan-slice instead of execute-task
+    if (result.action === "dispatch") {
+      assert.equal(
+        (result as any).unitType,
+        "plan-slice",
+        "missing task plan should trigger plan-slice recovery",
+      );
+    }
+    // It's also valid if the state changed due to cache invalidation
+    assert.ok(result.action, "should produce a valid dispatch action");
+  });
+
+  test("worktree directory disappearance: isGhostMilestone still works", () => {
+    const tmpBase = makeTempDir();
+    const mDir = join(tmpBase, ".gsd", "milestones", "M001");
+    mkdirSync(mDir, { recursive: true });
+
+    // Create worktree dir then delete it (simulates external deletion)
+    const wtDir = join(tmpBase, ".gsd", "worktrees", "M001");
+    mkdirSync(wtDir, { recursive: true });
+
+    // With worktree → not a ghost
+    assert.equal(isGhostMilestone(tmpBase, "M001"), false, "with worktree: not ghost");
+
+    // Delete worktree (simulates external process removing it)
+    rmSync(wtDir, { recursive: true, force: true });
+    assert.ok(!existsSync(wtDir), "worktree should be gone");
+
+    // Without worktree AND without DB → ghost (existsSync handles missing dir)
+    assert.equal(isGhostMilestone(tmpBase, "M001"), true, "without worktree: ghost");
+
+    rmSync(tmpBase, { recursive: true, force: true });
+  });
+});
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 7: Graduated Error Recovery in Auto-Loop
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("graduated error recovery logic", () => {
+  test("infrastructure error codes are exhaustive and non-overlapping", () => {
+    // Verify the set contains only OS-level error codes
+    for (const code of INFRA_ERROR_CODES) {
+      assert.ok(code.startsWith("E"), `infra code ${code} should start with E`);
+      assert.ok(code.length >= 4, `infra code ${code} should be at least 4 chars`);
+    }
+  });
+
+  test("SQLite corruption detection via message scan (no code property)", () => {
+    // Simulates sql.js or better-sqlite3 error without proper Node code
+    const err = new Error("SqliteError: database disk image is malformed");
+    const result = isInfrastructureError(err);
+    assert.equal(result, "SQLITE_CORRUPT");
+  });
+
+  test("provider rate limit is NOT an infrastructure error (retryable)", () => {
+    const err = new Error("rate_limit_exceeded: Too many requests");
+    assert.equal(isInfrastructureError(err), null);
+  });
+
+  test("overloaded_error is NOT an infrastructure error (retryable)", () => {
+    const err = new Error("overloaded_error: The model is currently overloaded");
+    assert.equal(isInfrastructureError(err), null);
+  });
+
+  test("authentication error is NOT an infrastructure error", () => {
+    const err = new Error("authentication_error: Invalid API key");
+    assert.equal(isInfrastructureError(err), null);
+  });
+
+  test("permission denied (EACCES) is NOT in infrastructure set", () => {
+    // EACCES is intentionally not in the set — it may indicate a fixable
+    // permissions issue rather than a hardware-level failure
+    const err = Object.assign(new Error("permission denied"), { code: "EACCES" });
+    assert.equal(isInfrastructureError(err), null);
+  });
+});
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 8: Multi-Iteration Stuck Scenarios
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("multi-iteration stuck scenarios", () => {
+  test("progressive window: normal → stuck after 3rd same unit", () => {
+    const window: WindowEntry[] = [];
+
+    window.push({ key: "A" });
+    assert.equal(detectStuck(window), null, "1 entry: not stuck");
+
+    window.push({ key: "A" });
+    assert.equal(detectStuck(window), null, "2 entries: not stuck yet");
+
+    window.push({ key: "A" });
+    assert.ok(detectStuck(window)?.stuck, "3 entries: stuck");
+  });
+
+  test("progressive window: oscillation builds up", () => {
+    const window: WindowEntry[] = [];
+
+    window.push({ key: "A" });
+    assert.equal(detectStuck(window), null);
+
+    window.push({ key: "B" });
+    assert.equal(detectStuck(window), null);
+
+    window.push({ key: "A" });
+    assert.equal(detectStuck(window), null, "3 entries A→B→A: not stuck yet");
+
+    window.push({ key: "B" });
+    assert.ok(detectStuck(window)?.stuck, "4 entries A→B→A→B: stuck");
+  });
+
+  test("mixed progress then stuck: A→B→C→C→C → stuck on C", () => {
+    const window: WindowEntry[] = [
+      { key: "A" },
+      { key: "B" },
+      { key: "C" },
+      { key: "C" },
+      { key: "C" },
+    ];
+    const result = detectStuck(window);
+    assert.ok(result?.stuck, "3 consecutive C: stuck");
+    assert.ok(result?.reason.includes("C"), "reason should mention stuck unit");
+  });
+
+  test("error in middle of window does not false-positive", () => {
+    const window: WindowEntry[] = [
+      { key: "A" },
+      { key: "B", error: "transient failure" },
+      { key: "C" },
+      { key: "D" },
+    ];
+    assert.equal(detectStuck(window), null, "single error should not trigger stuck");
+  });
+
+  test("consecutive errors on different keys still triggers Rule 1", () => {
+    const window: WindowEntry[] = [
+      { key: "A", error: "Provider returned 503 Service Unavailable" },
+      { key: "B", error: "Provider returned 503 Service Unavailable" },
+    ];
+    const result = detectStuck(window);
+    assert.ok(result?.stuck, "same error on different keys: stuck by Rule 1");
+  });
+});
+
+// ─────────────────────────────────────────────────────────────────────────
+// SECTION 9: State Consistency Under Concurrent DB Operations
+// ─────────────────────────────────────────────────────────────────────────
+
+describe("state consistency under DB mutations", () => {
+  let base: string;
+
+  afterEach(() => {
+    try { closeDatabase(); } catch { /* may not be open */ }
+    if (base) rmSync(base, { recursive: true, force: true });
+  });
+
+  test("rapid DB mutations produce consistent deriveStateFromDb results", async () => {
+    base = createMinimalFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "Feature", status: "in_progress" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "pending" });
+
+    // Rapid mutations with invalidation between each
+    invalidateAllCaches();
+    const states: string[] = [];
+
+    const s1 = await deriveStateFromDb(base);
+    states.push(s1.phase);
+
+    // pending → complete
+    const { updateTaskStatus } = await import("../../gsd-db.ts");
+    updateTaskStatus("M001", "S01", "T01", "complete", new Date().toISOString());
+    invalidateAllCaches();
+    const s2 = await deriveStateFromDb(base);
+    states.push(s2.phase);
+
+    // S01 should now be summarizing (all tasks done)
+    assert.equal(states[0], "executing", "initially executing");
+    assert.equal(states[1], "summarizing", "after task complete → summarizing");
+
+    // No state should be undefined or null
+    for (const phase of states) {
+      assert.ok(phase, "every state should have a valid phase");
+    }
+  });
+
+  test("DB milestone status change is reflected after cache invalidation", async () => {
+    base = createMinimalFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "Feature", status: "complete" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "complete" });
+
+    invalidateAllCaches();
+    const s1 = await deriveStateFromDb(base);
+    assert.equal(s1.phase, "validating-milestone");
+
+    // Mark milestone complete directly
+    const { updateMilestoneStatus } = await import("../../gsd-db.ts");
+    updateMilestoneStatus("M001", "complete", new Date().toISOString());
+    // Write SUMMARY to make it truly complete
+    writeFileSync(
+      join(base, ".gsd", "milestones", "M001", "M001-SUMMARY.md"),
+      "# M001 Summary\nDone.\n",
+    );
+
+    invalidateAllCaches();
+    const s2 = await deriveStateFromDb(base);
+    // With only M001 and it's complete, should be "complete"
+    assert.equal(s2.phase, "complete", "after milestone completion should be complete");
+  });
+
+  test("deriveState is idempotent: same inputs produce same outputs", async () => {
+    base = createMinimalFixture();
+    openDatabase(join(base, ".gsd", "gsd.db"));
+    insertMilestone({ id: "M001", title: "Active", status: "active" });
+    insertSlice({ id: "S01", milestoneId: "M001", title: "Feature", status: "in_progress" });
+    insertTask({ id: "T01", sliceId: "S01", milestoneId: "M001", status: "pending" });
+
+    // Call deriveState 5 times with cache invalidation between each
+    const results: string[] = [];
+    for (let i = 0; i < 5; i++) {
+      invalidateAllCaches();
+      const state = await deriveStateFromDb(base);
+      results.push(state.phase);
+    }
+
+    // All should be identical
+    const unique = new Set(results);
+    assert.equal(unique.size, 1, `expected all identical, got: ${[...unique].join(", ")}`);
+    assert.equal(results[0], "executing");
+  });
+});