feat(sf): wire escalation detection into state derivation (PDD)

State derivation now emits phase='escalating-task' when a task in the active slice is paused waiting for a user decision. Builds on the type+DDL foundation in 62dacb627. Together they get the loop to STOP when there's a pending escalation rather than carrying past an undocumented decision. PDD spec for this change: Purpose: pause auto-mode at the state-derivation layer when any task in the active slice has escalation_pending=1 with an unresolved escalation artifact. The dispatcher (next fire) sees phase='escalating-task' and returns 'stop' rather than dispatching new work over a pending decision. Consumer: state.ts deriveStateFromDb() callers — the auto-loop, the /sf status dashboard, the future /sf escalate command. Contract: 1. Empty tasks list → null (no pause). Verified. 2. Task without escalation_pending → null. Verified. 3. escalation_pending=1 but no artifact path → null (treats as not actionable). Verified. 4. escalation_pending=1 + valid artifact + no respondedAt → returns task id; state.phase = 'escalating-task' with task id in blockers and a /sf escalate hint in nextAction. Verified. 5. respondedAt set → null (already resolved, fall through). Verified. Failure boundary: any read/parse failure on the artifact returns null from detectPendingEscalation — state derivation falls through to existing behavior. Strict schema validation in readEscalationArtifact treats malformed artifacts as 'no actionable escalation here.' Evidence: smoke test exercises all 5 contract conditions end-to-end with real filesystem artifacts. Typecheck clean. Existing state derivation paths unchanged when no task is paused (early continue on escalation_pending !== 1 in detectPendingEscalation's loop). 
Non-goals: - Dispatch rule that returns 'stop' on phase='escalating-task' (next fire — needs no DB changes, just an auto-dispatch.ts edit) - Escalation artifact creation tools (gsd-2 has writeEscalationArtifact + buildEscalationArtifact + setTaskEscalationPending — those land when a task agent needs to file an escalation) - /sf escalate user command (later fire) Invariants: - Safety: no escalation pending → 0 file system reads (loop early-continues), zero behavior change vs current. - Liveness: if a task IS paused, state.phase becomes 'escalating-task' immediately — no race with dispatch ordering. Assumptions verified: - SF's EscalationArtifact + EscalationOption types match gsd-2's schema (verified earlier this session). - TaskRow has escalation_pending and escalation_artifact_path fields (added in 62dacb627). - getSliceTasks() returns DB rows that include those fields after the v23 migration ran. - state.ts has the slice-level scope I need (activeMilestone + activeSlice + registry + requirements + progress all visible at the insertion point). Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
2026-05-02 20:06:29 +02:00 · 2026-05-02 20:06:29 +02:00 · ea8819906d
commit ea8819906d
parent d3574f3c4d
2 changed files with 110 additions and 1 deletions
--- a/src/resources/extensions/sf/escalation.ts
+++ b/src/resources/extensions/sf/escalation.ts
@ -1,4 +1,82 @@
-// ADR-011 Phase 2 Mid-Execution Escalation — stub pending full DB schema port.
+// SF Extension — ADR-011 Phase 2 Mid-Execution Escalation (gsd-2 ADR)
+//
+// Currently scoped to detection only. The wider gsd-2 module (build/write/
+// resolve/list) requires several DB helpers SF doesn't yet have; those land
+// in subsequent fires. This file covers what state derivation + dispatch
+// need today: reading an artifact and detecting whether any task in a slice
+// is paused waiting for a user response.
+
+import { existsSync, readFileSync } from "node:fs";
+
+import type { TaskRow } from "./sf-db.js";
+import type { EscalationArtifact, EscalationOption } from "./types.js";
+
+/** Read and validate the escalation artifact JSON at `path`. Returns null when missing or malformed.
+ * Never throws: read and JSON-parse failures are caught and also yield null.
+ * Schema validation is strict (matches the eventual buildEscalationArtifact)
+ * so a hand-edited artifact cannot be weaker than what the writer would emit.
+ * Downstream callers can treat null as "no actionable escalation here." */
+export function readEscalationArtifact(path: string): EscalationArtifact | null {
+	if (!existsSync(path)) return null; // fast path: no file means no artifact
+	try {
+		const raw = readFileSync(path, "utf-8");
+		const parsed = JSON.parse(raw) as unknown;
+		if (!parsed || typeof parsed !== "object") return null; // JSON null and primitives are rejected
+		const art = parsed as Partial<EscalationArtifact>;
+		if (art.version !== 1) return null; // only schema version 1 is accepted
+		if (typeof art.taskId !== "string" || art.taskId.length === 0) return null;
+		if (typeof art.sliceId !== "string" || art.sliceId.length === 0) return null;
+		if (typeof art.milestoneId !== "string" || art.milestoneId.length === 0) {
+			return null;
+		}
+		if (typeof art.question !== "string" || art.question.length === 0) {
+			return null;
+		}
+		if (
+			!Array.isArray(art.options) ||
+			art.options.length < 2 ||
+			art.options.length > 4
+		) { // options must be an array of 2 to 4 entries
+			return null;
+		}
+		const optionIds = new Set<string>(); // ids seen so far, used to reject duplicates
+		for (const opt of art.options) {
+			if (!opt || typeof opt !== "object") return null;
+			const o = opt as Partial<EscalationOption>;
+			if (typeof o.id !== "string" || o.id.length === 0) return null;
+			if (typeof o.label !== "string") return null; // label/tradeoffs may be empty, but must be strings
+			if (typeof o.tradeoffs !== "string") return null;
+			if (optionIds.has(o.id)) return null; // option ids must be unique
+			optionIds.add(o.id);
+		}
+		if (typeof art.recommendation !== "string") return null;
+		if (!art.options.some((o) => o.id === art.recommendation)) return null; // recommendation must name an existing option id
+		if (typeof art.continueWithDefault !== "boolean") return null;
+		if (typeof art.createdAt !== "string") return null;
+		return art as EscalationArtifact; // fields not checked above (e.g. respondedAt) pass through as parsed
+	} catch { // unreadable file or invalid JSON: report as "no artifact"
+		return null;
+	}
+}
+
+/** Returns the task id of the first task with an un-resolved pause-escalation
+ * (escalation_pending=1, artifact path set, artifact passes validation, no respondedAt).
+ * Returns null when nothing in the slice is paused — caller should treat that as "carry on."
+ * `_basePath` is currently unused: each stored artifact path is read exactly as given.
+ * O(n) over the slice's tasks, with an early continue when escalation_pending
+ * isn't set, so the common no-escalation path costs almost nothing. */
+export function detectPendingEscalation(
+	tasks: TaskRow[],
+	_basePath: string,
+): string | null {
+	for (const t of tasks) {
+		if (t.escalation_pending !== 1) continue; // not flagged: skip before touching the file system
+		if (!t.escalation_artifact_path) continue; // flagged but no artifact recorded: not actionable
+		const art = readEscalationArtifact(t.escalation_artifact_path);
+		if (art && !art.respondedAt) return t.id; // valid artifact with no response yet: this task is paused
+	}
+	return null;
+}

 export function claimOverrideForInjection(
 	_basePath: string,
--- a/src/resources/extensions/sf/state.ts
+++ b/src/resources/extensions/sf/state.ts
@ -5,6 +5,7 @@
 import { existsSync, readdirSync, readFileSync } from "node:fs";
 import { join, resolve } from "node:path";
 import { debugCount, debugTime } from "./debug-logger.js";
+import { detectPendingEscalation } from "./escalation.js";
 import {
 	isValidTaskSummary,
 	loadFile,
@ -2167,6 +2168,36 @@ export async function _deriveStateImpl(basePath: string): Promise<SFState> {
 		}
 	}

+	// ── Mid-execution escalation (ADR-011 P2 — gsd-2 ADR) ────────────────
+	// Pause the loop if any task in the active slice has escalation_pending=1
+	// and an unresolved escalation artifact. The user must run /sf escalate
+	// resolve before auto-mode will continue. Falls through (returns null
+	// from detectPendingEscalation) when nothing is paused — no perf cost
+	// in the common path.
+	{
+		const dbTasks = getSliceTasks(activeMilestone.id, activeSlice.id);
+		const escalatingTaskId = detectPendingEscalation(dbTasks, basePath);
+		if (escalatingTaskId) {
+			return {
+				activeMilestone,
+				activeSlice,
+				activeTask: { id: escalatingTaskId, title: "" },
+				phase: "escalating-task",
+				recentDecisions: [],
+				blockers: [
+					`Task ${escalatingTaskId} requires a user decision before the loop can proceed`,
+				],
+				nextAction: `Run \`/sf escalate show ${escalatingTaskId}\` to review the options, then \`/sf escalate resolve ${escalatingTaskId} <choice>\` to proceed.`,
+				registry,
+				requirements,
+				progress: {
+					milestones: milestoneProgress,
+					slices: sliceProgress,
+				},
+			};
+		}
+	}
+
 	// ── Blocker detection: scan completed task summaries ──────────────────
 	// If any completed task has blocker_discovered: true and no REPLAN.md
 	// exists yet, transition to replanning-slice instead of executing.