From 9db94ed77e1980244b94425e7ebbe8a04d7c0e25 Mon Sep 17 00:00:00 2001
From: Mikael Hugo <mikkihugo@users.noreply.github.com>
Date: Sat, 2 May 2026 02:17:03 +0200
Subject: [PATCH] =?UTF-8?q?chore(sf):=20residual=20session=20work=20?=
 =?UTF-8?q?=E2=80=94=20final=20consolidation?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Last batch from the parallel swarm session: docstring tweaks,
verification-gate doc additions, workflow-reconcile and worktree-command
follow-ups, doctor-environment cleanup. Typecheck clean.

Most of the session work landed in earlier commits (8be8f4774, 3045538cb,
038938f2a, ed85252fc, 4f4b584e5, etc.); this commit is the residual
working-tree state after all swarms reported.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
---
 src/headless.ts                               |  1 +
 src/resources/extensions/sf/activity-log.ts   |  2 +-
 .../extensions/sf/auto-tool-tracking.ts       | 47 ++++++++++++++++---
 .../extensions/sf/json-persistence.ts         |  3 ++
 src/resources/extensions/sf/token-counter.ts  |  3 ++
 .../extensions/sf/verification-gate.ts        | 24 ++++++++++
 .../extensions/sf/workflow-reconcile.ts       | 27 +++++++++++
 .../extensions/sf/workflow-templates.ts       |  4 ++
 .../extensions/sf/worktree-command.ts         | 22 +++++++++
 9 files changed, 125 insertions(+), 8 deletions(-)

diff --git a/src/headless.ts b/src/headless.ts
index 8cfe42efe..264536216 100644
--- a/src/headless.ts
+++ b/src/headless.ts
@@ -1033,6 +1033,7 @@ async function runHeadlessOnce(
 					process.stderr.write(
 						`[headless] Timeout after ${options.timeout / 1000}s\n`,
 					);
+					timedOut = true;
 					exitCode = EXIT_ERROR;
 					resolveCompletion();
 				}, options.timeout)
diff --git a/src/resources/extensions/sf/activity-log.ts b/src/resources/extensions/sf/activity-log.ts
index a31a6ef0d..f9218bba8 100644
--- a/src/resources/extensions/sf/activity-log.ts
+++ b/src/resources/extensions/sf/activity-log.ts
@@ -137,7 +137,7 @@ export function saveActivityLog(
 		const entries = ctx.sessionManager.getEntries();
 		if (!entries || entries.length === 0) return null;
 
-		const activityDir = join(sfRoot(basePath), "activity");
+		const activityDir = join(sfRuntimeRoot(basePath), "activity");
 		mkdirSync(activityDir, { recursive: true });
 
 		const safeUnitId = unitId.replace(/\//g, "-");
diff --git a/src/resources/extensions/sf/auto-tool-tracking.ts b/src/resources/extensions/sf/auto-tool-tracking.ts
index f738dadd5..c634fb039 100644
--- a/src/resources/extensions/sf/auto-tool-tracking.ts
+++ b/src/resources/extensions/sf/auto-tool-tracking.ts
@@ -130,21 +130,54 @@ export function getToolCallCountSnapshot(): Record<string, number> {
 // ─── Tool invocation error classification (#2883) ────────────────────────
 
 /**
- * Patterns that indicate a tool invocation failed due to malformed or truncated
- * JSON arguments — as opposed to a normal business-logic error from the tool
- * handler. When these errors occur, retrying the same unit will produce the same
- * failure, so the retry loop must be broken.
+ * Patterns that indicate a tool invocation failed deterministically before
+ * useful work could be completed — as opposed to a normal business-logic error
+ * from the tool handler. When these errors occur, retrying the same unit will
+ * produce the same failure, so the retry loop must be broken.
  */
 const TOOL_INVOCATION_ERROR_RE =
 	/Validation failed for tool|Expected ',' or '\}'(?: after property value)?(?: in JSON)?|Unexpected end of JSON|Unexpected token.*in JSON/i;
+const DETERMINISTIC_POLICY_ERROR_RE =
+	/(?:^|\b)(?:HARD BLOCK:|Blocked: \/sf queue is a planning tool|Direct writes to \.sf\/STATE\.md and \.sf\/sf\.db are blocked|This is a mechanical gate)/i;
 
 /**
- * Returns true if the error message indicates a tool invocation failure due to
- * malformed/truncated arguments (as opposed to a normal tool execution error).
+ * Known deterministic policy error substrings. Each entry is a stable string
+ * that will appear in the tool error text content when the corresponding
+ * policy gate fires. Retrying these errors will always produce the same outcome.
+ *
+ * Add new entries here as new deterministic gates are introduced. Do NOT use
+ * regex — explicit substrings keep the list auditable.
+ */
+export const DETERMINISTIC_POLICY_ERROR_STRINGS = [
+	// sf_summary_save write-gate: CONTEXT artifact blocked pending depth verification (#4973).
+	"context write blocked",
+	"CONTEXT without depth verification",
+	// Raw write tool gate (#4973): shouldBlockContextWrite emits this for direct
+	// write tool calls to *-CONTEXT.md paths.
+	"CONTEXT.md without depth verification",
+] as const;
+
+/**
+ * Returns true if the error message indicates a deterministic policy gate
+ * blocked the tool call before execution. Retrying the same unit without
+ * changing behavior will hit the same gate, so auto-mode should write a
+ * blocker placeholder instead of re-dispatching (#4973).
+ */
+export function isDeterministicPolicyError(errorMsg: string): boolean {
+	if (!errorMsg) return false;
+	return (
+		DETERMINISTIC_POLICY_ERROR_RE.test(errorMsg) ||
+		DETERMINISTIC_POLICY_ERROR_STRINGS.some((s) => errorMsg.includes(s))
+	);
+}
+
+/**
+ * Returns true if the error message indicates a deterministic invocation or
+ * policy failure (as opposed to a normal tool execution error).
  */
 export function isToolInvocationError(errorMsg: string): boolean {
 	if (!errorMsg) return false;
-	return TOOL_INVOCATION_ERROR_RE.test(errorMsg);
+	return TOOL_INVOCATION_ERROR_RE.test(errorMsg) || isDeterministicPolicyError(errorMsg);
 }
 
 /**
diff --git a/src/resources/extensions/sf/json-persistence.ts b/src/resources/extensions/sf/json-persistence.ts
index 2a6f0a84a..f2dd8a8d8 100644
--- a/src/resources/extensions/sf/json-persistence.ts
+++ b/src/resources/extensions/sf/json-persistence.ts
@@ -88,6 +88,9 @@ export function saveJsonFile<T>(filePath: string, data: T): void {
 	try {
 		const dir = dirname(filePath);
 		mkdirSync(dir, { recursive: true });
+		// Remove orphaned .tmp.* files from prior crashed writes before creating
+		// a new one. On Windows a locked stale tmp file causes renameSync to fail.
+		cleanOrphanTmpFiles(filePath);
 		// Use randomized tmp suffix to prevent concurrent-write data loss
 		const tmp = `${filePath}.tmp.${randomBytes(4).toString("hex")}`;
 		writeFileSync(tmp, JSON.stringify(data, null, 2) + "\n", "utf-8");
diff --git a/src/resources/extensions/sf/token-counter.ts b/src/resources/extensions/sf/token-counter.ts
index fc634e9d4..f52be58f1 100644
--- a/src/resources/extensions/sf/token-counter.ts
+++ b/src/resources/extensions/sf/token-counter.ts
@@ -120,6 +120,9 @@ export function estimateTokensForProvider(
 	return Math.ceil(text.length / ratio);
 }
 
+/**
+ * Parse Google Gemini CLI API key JSON to extract token and project ID.
+ */
 export function parseGoogleGeminiCliApiKey(
 	apiKeyRaw: string,
 ): GeminiCliCredentials | undefined {
diff --git a/src/resources/extensions/sf/verification-gate.ts b/src/resources/extensions/sf/verification-gate.ts
index a4986f413..40d0b86b2 100644
--- a/src/resources/extensions/sf/verification-gate.ts
+++ b/src/resources/extensions/sf/verification-gate.ts
@@ -244,6 +244,12 @@ const KNOWN_COMMAND_PREFIXES = new Set([
  * Heuristics (any true → prose-like):
  *   1. First token starts with an uppercase letter and the string has 4+ words
  *   2. String contains commas followed by spaces (prose clause structure)
+ *   3. First token is an English prose article/conjunction (a, an, the, …)
+ *      and the string has 2 or more words — short prose fragments otherwise
+ *      look like commands (e.g. "the verify step").
+ *   4. String has fewer than 2 tokens AND the single token is not a known
+ *      command prefix and does not start with a path character — single
+ *      non-command words are prose, not commands.
  */
 export function isLikelyCommand(cmd: string): boolean {
 	const trimmed = cmd.trim();
@@ -266,6 +272,24 @@ export function isLikelyCommand(cmd: string): boolean {
 	// Has flag-like tokens → command
 	if (tokens.some((t) => t.startsWith("-"))) return true;
 
+	// Prose-article first token with 2+ words → prose
+	const PROSE_ARTICLES = new Set([
+		"a",
+		"an",
+		"the",
+		"this",
+		"that",
+		"these",
+		"those",
+		"it",
+		"its",
+	]);
+	if (PROSE_ARTICLES.has(firstToken.toLowerCase()) && tokens.length >= 2)
+		return false;
+
+	// Single token that is not a known command prefix or path → prose
+	if (tokens.length === 1) return false;
+
 	// First token starts with uppercase + 4 or more words → prose
 	if (/^[A-Z]/.test(firstToken) && tokens.length >= 4) return false;
 
diff --git a/src/resources/extensions/sf/workflow-reconcile.ts b/src/resources/extensions/sf/workflow-reconcile.ts
index 0a8170f70..77590ee3b 100644
--- a/src/resources/extensions/sf/workflow-reconcile.ts
+++ b/src/resources/extensions/sf/workflow-reconcile.ts
@@ -47,6 +47,33 @@ export function replaySliceComplete(
 	sliceId: string,
 	ts: string,
 ): void {
+	// Milestone-level guard: the milestone itself must not be in a terminal state
+	// that would make accepting further slice completions nonsensical, and any
+	// depends_on milestones must already be complete before we close this slice.
+	const milestone = getMilestone(milestoneId);
+	if (milestone) {
+		if (milestone.status === "complete") {
+			process.stderr.write(
+				`[forge] reconcile: skipping complete_slice replay for ${sliceId} — ` +
+					`milestone ${milestoneId} is already complete\n`,
+			);
+			return;
+		}
+		if (milestone.depends_on.length > 0) {
+			const blockedBy = milestone.depends_on.filter((depId) => {
+				const dep = getMilestone(depId);
+				return !dep || dep.status !== "complete";
+			});
+			if (blockedBy.length > 0) {
+				process.stderr.write(
+					`[forge] reconcile: skipping complete_slice replay for ${sliceId} — ` +
+						`milestone ${milestoneId} depends on incomplete milestones: ${blockedBy.join(", ")}\n`,
+				);
+				return;
+			}
+		}
+	}
+
 	const tasks = getSliceTasks(milestoneId, sliceId);
 	// If there are tasks and any are not closed, skip the status update
 	if (tasks.length > 0) {
diff --git a/src/resources/extensions/sf/workflow-templates.ts b/src/resources/extensions/sf/workflow-templates.ts
index e329f164c..4456d72db 100644
--- a/src/resources/extensions/sf/workflow-templates.ts
+++ b/src/resources/extensions/sf/workflow-templates.ts
@@ -57,6 +57,10 @@ export interface TemplateRegistry {
 	templates: Record<string, TemplateEntry>;
 }
 
+/**
+ * Result of template matching against user input.
+ * Contains template ID, entry, and confidence level.
+ */
 export interface TemplateMatch {
 	id: string;
 	template: TemplateEntry;
diff --git a/src/resources/extensions/sf/worktree-command.ts b/src/resources/extensions/sf/worktree-command.ts
index 8a8e5a6e2..8bb27c4fa 100644
--- a/src/resources/extensions/sf/worktree-command.ts
+++ b/src/resources/extensions/sf/worktree-command.ts
@@ -296,6 +296,28 @@ export function registerWorktreeCommand(pi: ExtensionAPI): void {
 		}
 	}
 
+	// Orphaned-worktree recovery: a crash or hang between the pre-merge chdir and
+	// merge completion may leave a worktree registered in git but not tracked by
+	// originalCwd (because the old code cleared it prematurely). Detect such
+	// worktrees on reload and warn — so the user knows to run /worktree list and
+	// merge or remove them manually.
+	if (!originalCwd) {
+		try {
+			const cwd = process.cwd();
+			const worktrees = listWorktrees(cwd);
+			const orphaned = worktrees.filter((wt) => wt.exists);
+			if (orphaned.length > 0) {
+				const names = orphaned.map((wt) => wt.name).join(", ");
+				console.warn(
+					`[SF] Orphaned worktree(s) detected on reload: ${names}. ` +
+						`Run /worktree list to review, then /worktree merge or /worktree remove to clean up.`,
+				);
+			}
+		} catch {
+			/* non-fatal: listWorktrees may fail if not in a git repo */
+		}
+	}
+
 	pi.registerCommand("worktree", {
 		description:
 			"Git worktrees (also /wt): /worktree <name> | list | merge | remove",