feat: Headless Integration Hardening & Release (M002) (#2811)

* feat: Migrated headless orchestrator to use execution_complete events,… - "src/headless.ts" - "src/headless-ui.ts" - "src/tests/headless-v2-migration.test.ts" GSD-Task: S06/T02 * test: Wired pi-coding-agent to re-export JSONL utils from @gsd/rpc-clie… - "packages/pi-coding-agent/src/modes/rpc/jsonl.ts" - "packages/pi-coding-agent/package.json" - "packages/rpc-client/src/index.ts" - "packages/rpc-client/src/jsonl.ts" - "packages/rpc-client/src/rpc-client.ts" - "packages/rpc-client/src/rpc-types.ts" - "packages/rpc-client/src/rpc-client.test.ts" - "packages/rpc-client/package.json" GSD-Task: S06/T03 * feat: Wire --resume flag to resolve session IDs via prefix matching and… - "src/headless.ts" - "dist/headless.js" GSD-Task: S01/T01 * test: Added 5 e2e integration tests proving headless JSON batch, SIGINT… - "src/tests/integration/e2e-headless.test.ts" GSD-Task: S01/T02 * test: Updated @gsd/rpc-client and @gsd/mcp-server to 2.52.0 with publis… - "packages/rpc-client/package.json" - "packages/mcp-server/package.json" - "packages/rpc-client/.npmignore" - "packages/mcp-server/.npmignore" GSD-Task: S02/T01 * chore: auto-commit after complete-milestone GSD-Unit: M002-gzq23a * fix: revert jsonl.ts to inline implementation — @gsd-build/rpc-client not available at source-level test time in CI The re-export from @gsd-build/rpc-client fails in CI because tests run against TypeScript source (--experimental-strip-types) before any build step. The npm dependency resolves to node_modules/ which requires dist/ to exist. Reverting to the original inline implementation eliminates the cross-package dependency for source-level imports.
2026-03-26 23:33:22 -06:00 · 2026-03-26 23:33:22 -06:00 · a91b8bec34
commit a91b8bec34
parent 5abf9652b3
24 changed files with 2995 additions and 83 deletions
--- a/package-lock.json
+++ b/package-lock.json
@ -1,12 +1,12 @@
 {
  "name": "gsd-pi",
-  "version": "2.51.0",
+  "version": "2.52.0",
  "lockfileVersion": 3,
  "requires": true,
  "packages": {
    "": {
      "name": "gsd-pi",
-      "version": "2.51.0",
+      "version": "2.52.0",
      "hasInstallScript": true,
      "license": "MIT",
      "workspaces": [
@ -1815,10 +1815,14 @@
        "win32"
      ]
    },
-    "node_modules/@gsd/mcp-server": {
+    "node_modules/@gsd-build/mcp-server": {
      "resolved": "packages/mcp-server",
      "link": true
    },
+    "node_modules/@gsd-build/rpc-client": {
+      "resolved": "packages/rpc-client",
+      "link": true
+    },
    "node_modules/@gsd/native": {
      "resolved": "packages/native",
      "link": true
@ -1839,10 +1843,6 @@
      "resolved": "packages/pi-tui",
      "link": true
    },
-    "node_modules/@gsd/rpc-client": {
-      "resolved": "packages/rpc-client",
-      "link": true
-    },
    "node_modules/@gsd/studio": {
      "resolved": "studio",
      "link": true
@ -9150,10 +9150,11 @@
      }
    },
    "packages/mcp-server": {
-      "name": "@gsd/mcp-server",
-      "version": "2.51.0",
+      "name": "@gsd-build/mcp-server",
+      "version": "2.52.0",
+      "license": "MIT",
      "dependencies": {
-        "@gsd/rpc-client": "*",
+        "@gsd-build/rpc-client": "^2.52.0",
        "@modelcontextprotocol/sdk": "^1.27.1",
        "zod": "^4.0.0"
      },
@ -9218,7 +9219,7 @@
    },
    "packages/pi-coding-agent": {
      "name": "@gsd/pi-coding-agent",
-      "version": "2.51.0",
+      "version": "2.52.0",
      "dependencies": {
        "@mariozechner/jiti": "^2.6.2",
        "@silvia-odwyer/photon-node": "^0.3.4",
@ -9261,8 +9262,9 @@
      }
    },
    "packages/rpc-client": {
-      "name": "@gsd/rpc-client",
-      "version": "2.51.0",
+      "name": "@gsd-build/rpc-client",
+      "version": "2.52.0",
+      "license": "MIT",
      "engines": {
        "node": ">=22.0.0"
      }
--- a/packages/mcp-server/.npmignore
+++ b/packages/mcp-server/.npmignore
@ -0,0 +1 @@
+dist/*.test.*
--- a/packages/mcp-server/README.md
+++ b/packages/mcp-server/README.md
@ -1,4 +1,4 @@
-# @gsd/mcp-server
+# @gsd-build/mcp-server

 MCP server exposing GSD orchestration tools for Claude Code, Cursor, and other MCP-compatible clients.

@ -7,7 +7,7 @@ Start GSD auto-mode sessions, poll progress, resolve blockers, and retrieve resu
 ## Installation

 ```bash
-npm install @gsd/mcp-server
+npm install @gsd-build/mcp-server
 ```

 Or with the monorepo workspace:
@ -180,12 +180,12 @@ Resolve a pending blocker in a session by sending a response to the blocked UI r

 ```
 ┌─────────────────┐     stdio      ┌──────────────────┐
-│  MCP Client     │ ◄────────────► │  @gsd/mcp-server │
+│  MCP Client     │ ◄────────────► │  @gsd-build/mcp-server │
 │  (Claude Code,  │    JSON-RPC    │                  │
 │   Cursor, etc.) │                │  SessionManager  │
 └─────────────────┘                │       │          │
                                   │       ▼          │
-                                   │  @gsd/rpc-client │
+                                   │  @gsd-build/rpc-client │
                                   │       │          │
                                   │       ▼          │
                                   │  GSD CLI (child  │
@ -193,9 +193,9 @@ Resolve a pending blocker in a session by sending a response to the blocked UI r
                                   └──────────────────┘
 ```

- **@gsd/mcp-server** — MCP protocol adapter. Translates MCP tool calls into SessionManager operations.
+- **@gsd-build/mcp-server** — MCP protocol adapter. Translates MCP tool calls into SessionManager operations.
 - **SessionManager** — Manages RpcClient lifecycle. One session per project directory. Tracks events in a ring buffer (last 50), detects blockers, accumulates cost.
- **@gsd/rpc-client** — Low-level RPC client that spawns and communicates with the GSD CLI process via JSON-RPC over stdio.
+- **@gsd-build/rpc-client** — Low-level RPC client that spawns and communicates with the GSD CLI process via JSON-RPC over stdio.

 ## License

--- a/packages/mcp-server/package.json
+++ b/packages/mcp-server/package.json
@ -1,7 +1,16 @@
 {
-  "name": "@gsd/mcp-server",
-  "version": "2.51.0",
+  "name": "@gsd-build/mcp-server",
+  "version": "2.52.0",
  "description": "MCP server exposing GSD orchestration tools for Claude Code, Cursor, and other MCP clients",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "https://github.com/gsd-build/gsd-2.git",
+    "directory": "packages/mcp-server"
+  },
+  "publishConfig": {
+    "access": "public"
+  },
  "type": "module",
  "main": "./dist/index.js",
  "types": "./dist/index.d.ts",
@ -20,7 +29,7 @@
  },
  "dependencies": {
    "@modelcontextprotocol/sdk": "^1.27.1",
-    "@gsd/rpc-client": "*",
+    "@gsd-build/rpc-client": "^2.52.0",
    "zod": "^4.0.0"
  },
  "devDependencies": {
@ -31,6 +40,7 @@
    "node": ">=22.0.0"
  },
  "files": [
-    "dist"
+    "dist",
+    "!dist/**/*.test.*"
  ]
 }
--- a/packages/mcp-server/src/cli.ts
+++ b/packages/mcp-server/src/cli.ts
@ -1,7 +1,7 @@
 #!/usr/bin/env node

 /**
- * @gsd/mcp-server CLI — stdio transport entry point.
+ * @gsd-build/mcp-server CLI — stdio transport entry point.
 *
 * Connects the MCP server to stdin/stdout for use by Claude Code,
 * Cursor, and other MCP-compatible clients.
--- a/packages/mcp-server/src/index.ts
+++ b/packages/mcp-server/src/index.ts
@ -1,5 +1,5 @@
 /**
- * @gsd/mcp-server — MCP server for GSD orchestration.
+ * @gsd-build/mcp-server — MCP server for GSD orchestration.
 */

 export { SessionManager } from './session-manager.js';
--- a/packages/mcp-server/src/mcp-server.test.ts
+++ b/packages/mcp-server/src/mcp-server.test.ts
@ -1,7 +1,7 @@
 /**
- * @gsd/mcp-server — Integration and unit tests.
+ * @gsd-build/mcp-server — Integration and unit tests.
 *
- * Strategy: We cannot mock @gsd/rpc-client at the module level without
+ * Strategy: We cannot mock @gsd-build/rpc-client at the module level without
 * --experimental-test-module-mocks. Instead we test by:
 *
 * 1. Subclassing SessionManager to inject a mock client factory
--- a/packages/mcp-server/src/session-manager.ts
+++ b/packages/mcp-server/src/session-manager.ts
@ -8,8 +8,8 @@

 import { execSync } from 'node:child_process';
 import { resolve } from 'node:path';
-import { RpcClient } from '@gsd/rpc-client';
-import type { SdkAgentEvent, RpcInitResult, RpcCostUpdateEvent, RpcExtensionUIRequest } from '@gsd/rpc-client';
+import { RpcClient } from '@gsd-build/rpc-client';
+import type { SdkAgentEvent, RpcInitResult, RpcCostUpdateEvent, RpcExtensionUIRequest } from '@gsd-build/rpc-client';
 import type {
  ManagedSession,
  ExecuteOptions,
--- a/packages/mcp-server/src/types.ts
+++ b/packages/mcp-server/src/types.ts
@ -2,7 +2,7 @@
 * MCP Server types — session lifecycle and orchestration.
 */

-import type { RpcClient, SdkAgentEvent, RpcCostUpdateEvent, RpcExtensionUIRequest } from '@gsd/rpc-client';
+import type { RpcClient, SdkAgentEvent, RpcCostUpdateEvent, RpcExtensionUIRequest } from '@gsd-build/rpc-client';

 // ---------------------------------------------------------------------------
 // Session Status
--- a/packages/rpc-client/.npmignore
+++ b/packages/rpc-client/.npmignore
@ -0,0 +1 @@
+dist/*.test.*
--- a/packages/rpc-client/README.md
+++ b/packages/rpc-client/README.md
@ -0,0 +1,125 @@
+# @gsd-build/rpc-client
+
+Standalone RPC client SDK for GSD. Spawn the agent process, perform a v2 protocol handshake, send commands, and consume typed events via an async generator — all in a few lines of TypeScript.
+
+Zero internal dependencies. Ships its own inlined types.
+
+## Installation
+
+```bash
+npm install @gsd-build/rpc-client
+```
+
+## Quick Start
+
+```typescript
+import { RpcClient } from '@gsd-build/rpc-client';
+
+const client = new RpcClient({ cwd: process.cwd() });
+await client.start();
+const { sessionId } = await client.init({ clientId: 'my-app' });
+console.log(`Session: ${sessionId}`);
+
+await client.prompt('Create a hello world script');
+for await (const event of client.events()) {
+  if (event.type === 'execution_complete') break;
+  console.log(event.type);
+}
+await client.shutdown();
+```
+
+## API
+
+### Constructor
+
+```typescript
+const client = new RpcClient(options?: RpcClientOptions);
+```
+
+| Option     | Type                     | Description                              |
+|------------|--------------------------|------------------------------------------|
+| `cliPath`  | `string`                 | Path to the CLI entry point              |
+| `cwd`      | `string`                 | Working directory for the agent          |
+| `env`      | `Record<string, string>` | Environment variables                    |
+| `provider` | `string`                 | AI provider (e.g. `"anthropic"`)         |
+| `model`    | `string`                 | Model ID (e.g. `"claude-sonnet"`)        |
+| `args`     | `string[]`               | Additional CLI arguments                 |
+
+### Lifecycle
+
+| Method        | Description                                    |
+|---------------|------------------------------------------------|
+| `start()`     | Spawn the agent process                        |
+| `init(opts?)` | v2 handshake — returns `sessionId`, capabilities |
+| `shutdown()`  | Graceful shutdown                              |
+| `stop()`      | Force-kill the process                         |
+
+### Commands
+
+| Method                         | Description                            |
+|--------------------------------|----------------------------------------|
+| `prompt(message, images?)`     | Send a prompt                          |
+| `steer(message, images?)`      | Interrupt with a steering message      |
+| `followUp(message, images?)`   | Queue a follow-up message              |
+| `abort()`                      | Abort current operation                |
+| `subscribe(events)`            | Subscribe to event types (`["*"]` for all) |
+
+### Events
+
+```typescript
+// Async generator — recommended
+for await (const event of client.events()) {
+  console.log(event.type);
+}
+
+// Callback-based
+const unsubscribe = client.onEvent((event) => {
+  console.log(event.type);
+});
+```
+
+### Helpers
+
+| Method                                | Description                              |
+|---------------------------------------|------------------------------------------|
+| `waitForIdle(timeout?)`               | Wait for `agent_end` event               |
+| `collectEvents(timeout?)`             | Collect events until idle                |
+| `promptAndWait(message, images?, t?)` | Send prompt and collect events           |
+
+### Session & Model
+
+| Method                           | Description                       |
+|----------------------------------|-----------------------------------|
+| `getState()`                     | Get session state                 |
+| `setModel(provider, modelId)`    | Set model                         |
+| `cycleModel()`                   | Cycle to next model               |
+| `getAvailableModels()`           | List available models             |
+| `setThinkingLevel(level)`        | Set thinking level                |
+| `cycleThinkingLevel()`           | Cycle thinking level              |
+| `compact(instructions?)`         | Compact session context           |
+| `getSessionStats()`              | Get session statistics            |
+| `bash(command)`                  | Execute a bash command            |
+| `newSession(parent?)`            | Start a new session               |
+| `sendUIResponse(id, response)`   | Respond to extension UI requests  |
+
+## Type Exports
+
+All protocol types are exported from the package root:
+
+```typescript
+import type {
+  RpcCommand,
+  RpcResponse,
+  RpcInitResult,
+  RpcExecutionCompleteEvent,
+  RpcCostUpdateEvent,
+  RpcV2Event,
+  SessionStats,
+  SdkAgentEvent,
+  RpcClientOptions,
+} from '@gsd-build/rpc-client';
+```
+
+## License
+
+MIT
--- a/packages/rpc-client/examples/basic-usage.ts
+++ b/packages/rpc-client/examples/basic-usage.ts
@ -0,0 +1,13 @@
+import { RpcClient } from '@gsd-build/rpc-client';
+
+const client = new RpcClient({ cwd: process.cwd() });
+await client.start();
+const { sessionId } = await client.init({ clientId: 'my-app' });
+console.log(`Session: ${sessionId}`);
+
+await client.prompt('Create a hello world script');
+for await (const event of client.events()) {
+  if (event.type === 'execution_complete') break;
+  console.log(event.type);
+}
+await client.shutdown();
--- a/packages/rpc-client/package.json
+++ b/packages/rpc-client/package.json
@ -1,7 +1,16 @@
 {
-  "name": "@gsd/rpc-client",
-  "version": "2.51.0",
+  "name": "@gsd-build/rpc-client",
+  "version": "2.52.0",
  "description": "Standalone RPC client SDK for GSD — zero internal dependencies",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "https://github.com/gsd-build/gsd-2.git",
+    "directory": "packages/rpc-client"
+  },
+  "publishConfig": {
+    "access": "public"
+  },
  "type": "module",
  "main": "./dist/index.js",
  "types": "./dist/index.d.ts",
@ -12,8 +21,13 @@
    }
  },
  "files": [
-    "dist"
+    "dist",
+    "!dist/**/*.test.*"
  ],
+  "scripts": {
+    "build": "tsc -p tsconfig.json",
+    "test": "node --test dist/rpc-client.test.js"
+  },
  "engines": {
    "node": ">=22.0.0"
  }
--- a/packages/rpc-client/src/index.ts
+++ b/packages/rpc-client/src/index.ts
@ -0,0 +1,10 @@
+/**
+ * @gsd-build/rpc-client — standalone RPC client SDK for GSD.
+ *
+ * Re-exports all types, JSONL utilities, and the RpcClient class.
+ */
+
+export * from "./rpc-types.js";
+export { serializeJsonLine, attachJsonlLineReader } from "./jsonl.js";
+export { RpcClient } from "./rpc-client.js";
+export type { RpcClientOptions, RpcEventListener, SdkAgentEvent } from "./rpc-client.js";
--- a/packages/rpc-client/src/jsonl.ts
+++ b/packages/rpc-client/src/jsonl.ts
@ -0,0 +1,64 @@
+import type { Readable } from "node:stream";
+import { StringDecoder } from "node:string_decoder";
+
+/**
+ * Serialize a single strict JSONL record.
+ *
+ * Framing is LF-only. Payload strings may contain other Unicode separators such as
+ * U+2028 and U+2029. Clients must split records on `\n` only.
+ */
+export function serializeJsonLine(value: unknown): string {
+	return `${JSON.stringify(value)}\n`;
+}
+
+/**
+ * Attach an LF-only JSONL reader to a stream.
+ *
+ * This intentionally does not use Node readline. Readline splits on additional
+ * Unicode separators that are valid inside JSON strings and therefore does not
+ * implement strict JSONL framing.
+ */
+export function attachJsonlLineReader(stream: Readable, onLine: (line: string) => void): () => void {
+	const decoder = new StringDecoder("utf8");
+	let buffer = "";
+
+	const emitLine = (line: string) => {
+		onLine(line.endsWith("\r") ? line.slice(0, -1) : line);
+	};
+
+	const onData = (chunk: string | Buffer) => {
+		buffer += typeof chunk === "string" ? chunk : decoder.write(chunk);
+
+		while (true) {
+			const newlineIndex = buffer.indexOf("\n");
+			if (newlineIndex === -1) {
+				return;
+			}
+
+			emitLine(buffer.slice(0, newlineIndex));
+			buffer = buffer.slice(newlineIndex + 1);
+		}
+	};
+
+	const onEnd = () => {
+		buffer += decoder.end();
+		if (buffer.length > 0) {
+			emitLine(buffer);
+			buffer = "";
+		}
+	};
+
+	const onError = (_err: Error) => {
+		// Stream errors are non-fatal for JSONL reading
+	};
+
+	stream.on("data", onData);
+	stream.on("end", onEnd);
+	stream.on("error", onError);
+
+	return () => {
+		stream.off("data", onData);
+		stream.off("end", onEnd);
+		stream.off("error", onError);
+	};
+}
--- a/packages/rpc-client/src/rpc-client.test.ts
+++ b/packages/rpc-client/src/rpc-client.test.ts
@ -0,0 +1,568 @@
+import { describe, it, beforeEach, afterEach } from "node:test";
+import assert from "node:assert/strict";
+import { PassThrough } from "node:stream";
+import { serializeJsonLine, attachJsonlLineReader } from "./jsonl.js";
+import type {
+	RpcInitResult,
+	RpcExecutionCompleteEvent,
+	RpcCostUpdateEvent,
+	RpcProtocolVersion,
+	SessionStats,
+	RpcV2Event,
+} from "./rpc-types.js";
+import { RpcClient } from "./rpc-client.js";
+import type { SdkAgentEvent } from "./rpc-client.js";
+
+// ============================================================================
+// JSONL Tests
+// ============================================================================
+
+describe("serializeJsonLine", () => {
+	it("produces valid JSON terminated with LF", () => {
+		const result = serializeJsonLine({ type: "test", value: 42 });
+		assert.ok(result.endsWith("\n"), "must end with LF");
+		const parsed = JSON.parse(result.trim());
+		assert.equal(parsed.type, "test");
+		assert.equal(parsed.value, 42);
+	});
+
+	it("serializes strings with special characters", () => {
+		const result = serializeJsonLine({ msg: "hello\nworld" });
+		assert.ok(result.endsWith("\n"));
+		// The embedded \n must be escaped inside the JSON — only the trailing LF is the framing delimiter
+		const lines = result.split("\n");
+		// Should be exactly 2 parts: the JSON line and the empty string after trailing LF
+		assert.equal(lines.length, 2);
+		assert.equal(lines[1], "");
+		const parsed = JSON.parse(lines[0]);
+		assert.equal(parsed.msg, "hello\nworld");
+	});
+
+	it("handles empty objects", () => {
+		const result = serializeJsonLine({});
+		assert.equal(result, "{}\n");
+	});
+});
+
+describe("attachJsonlLineReader", () => {
+	it("splits on LF correctly", async () => {
+		const stream = new PassThrough();
+		const lines: string[] = [];
+
+		attachJsonlLineReader(stream, (line) => lines.push(line));
+
+		stream.write('{"a":1}\n{"b":2}\n');
+		stream.end();
+
+		// Let microtask queue flush
+		await new Promise((r) => setTimeout(r, 10));
+
+		assert.equal(lines.length, 2);
+		assert.equal(JSON.parse(lines[0]).a, 1);
+		assert.equal(JSON.parse(lines[1]).b, 2);
+	});
+
+	it("handles chunked data across boundaries", async () => {
+		const stream = new PassThrough();
+		const lines: string[] = [];
+
+		attachJsonlLineReader(stream, (line) => lines.push(line));
+
+		// Write in fragments that split mid-line
+		stream.write('{"type":"hel');
+		stream.write('lo"}\n{"type":"w');
+		stream.write('orld"}\n');
+		stream.end();
+
+		await new Promise((r) => setTimeout(r, 10));
+
+		assert.equal(lines.length, 2);
+		assert.equal(JSON.parse(lines[0]).type, "hello");
+		assert.equal(JSON.parse(lines[1]).type, "world");
+	});
+
+	it("emits trailing data on stream end", async () => {
+		const stream = new PassThrough();
+		const lines: string[] = [];
+
+		attachJsonlLineReader(stream, (line) => lines.push(line));
+
+		stream.write('{"final":true}');
+		stream.end();
+
+		await new Promise((r) => setTimeout(r, 10));
+
+		assert.equal(lines.length, 1);
+		assert.equal(JSON.parse(lines[0]).final, true);
+	});
+
+	it("returns a detach function that stops reading", async () => {
+		const stream = new PassThrough();
+		const lines: string[] = [];
+
+		const detach = attachJsonlLineReader(stream, (line) => lines.push(line));
+
+		stream.write('{"a":1}\n');
+		await new Promise((r) => setTimeout(r, 10));
+		assert.equal(lines.length, 1);
+
+		detach();
+
+		stream.write('{"b":2}\n');
+		stream.end();
+		await new Promise((r) => setTimeout(r, 10));
+
+		// Should still be 1 — detach removed listeners
+		assert.equal(lines.length, 1);
+	});
+
+	it("strips CR from CRLF line endings", async () => {
+		const stream = new PassThrough();
+		const lines: string[] = [];
+
+		attachJsonlLineReader(stream, (line) => lines.push(line));
+
+		stream.write('{"v":1}\r\n');
+		stream.end();
+
+		await new Promise((r) => setTimeout(r, 10));
+
+		assert.equal(lines.length, 1);
+		assert.equal(JSON.parse(lines[0]).v, 1);
+	});
+});
+
+// ============================================================================
+// Type Shape Tests
+// ============================================================================
+
+describe("type shapes", () => {
+	it("RpcInitResult has protocolVersion, sessionId, capabilities", () => {
+		const init: RpcInitResult = {
+			protocolVersion: 2,
+			sessionId: "sess_123",
+			capabilities: {
+				events: ["execution_complete", "cost_update"],
+				commands: ["prompt", "steer"],
+			},
+		};
+		assert.equal(init.protocolVersion, 2);
+		assert.equal(init.sessionId, "sess_123");
+		assert.ok(Array.isArray(init.capabilities.events));
+		assert.ok(Array.isArray(init.capabilities.commands));
+	});
+
+	it("RpcExecutionCompleteEvent has required fields", () => {
+		const event: RpcExecutionCompleteEvent = {
+			type: "execution_complete",
+			runId: "run_abc",
+			status: "completed",
+			stats: {
+				sessionFile: "/tmp/session.json",
+				sessionId: "sess_123",
+				userMessages: 5,
+				assistantMessages: 5,
+				toolCalls: 3,
+				toolResults: 3,
+				totalMessages: 10,
+				tokens: { input: 1000, output: 500, cacheRead: 200, cacheWrite: 100, total: 1800 },
+				cost: 0.05,
+			},
+		};
+		assert.equal(event.type, "execution_complete");
+		assert.equal(event.runId, "run_abc");
+		assert.equal(event.status, "completed");
+		assert.ok(event.stats);
+		assert.equal(event.stats.sessionId, "sess_123");
+	});
+
+	it("RpcCostUpdateEvent has required fields", () => {
+		const event: RpcCostUpdateEvent = {
+			type: "cost_update",
+			runId: "run_abc",
+			turnCost: 0.01,
+			cumulativeCost: 0.05,
+			tokens: { input: 500, output: 200, cacheRead: 100, cacheWrite: 50 },
+		};
+		assert.equal(event.type, "cost_update");
+		assert.equal(event.runId, "run_abc");
+		assert.equal(event.turnCost, 0.01);
+		assert.equal(event.cumulativeCost, 0.05);
+		assert.ok(event.tokens);
+	});
+
+	it("SessionStats has all expected fields", () => {
+		const stats: SessionStats = {
+			sessionFile: "/tmp/session.json",
+			sessionId: "s1",
+			userMessages: 10,
+			assistantMessages: 10,
+			toolCalls: 5,
+			toolResults: 5,
+			totalMessages: 20,
+			tokens: { input: 2000, output: 1000, cacheRead: 500, cacheWrite: 200, total: 3700 },
+			cost: 0.10,
+		};
+		assert.equal(stats.sessionId, "s1");
+		assert.equal(stats.userMessages, 10);
+		assert.equal(stats.tokens.total, 3700);
+		assert.equal(stats.cost, 0.10);
+	});
+
+	it("RpcProtocolVersion accepts 1 and 2", () => {
+		const v1: RpcProtocolVersion = 1;
+		const v2: RpcProtocolVersion = 2;
+		assert.equal(v1, 1);
+		assert.equal(v2, 2);
+	});
+
+	it("RpcV2Event discriminated union covers both event types", () => {
+		const events: RpcV2Event[] = [
+			{
+				type: "execution_complete",
+				runId: "r1",
+				status: "completed",
+				stats: {
+					sessionFile: undefined,
+					sessionId: "s1",
+					userMessages: 1,
+					assistantMessages: 1,
+					toolCalls: 0,
+					toolResults: 0,
+					totalMessages: 2,
+					tokens: { input: 100, output: 50, cacheRead: 0, cacheWrite: 0, total: 150 },
+					cost: 0.001,
+				},
+			},
+			{
+				type: "cost_update",
+				runId: "r1",
+				turnCost: 0.001,
+				cumulativeCost: 0.001,
+				tokens: { input: 100, output: 50, cacheRead: 0, cacheWrite: 0 },
+			},
+		];
+		assert.equal(events.length, 2);
+		assert.equal(events[0].type, "execution_complete");
+		assert.equal(events[1].type, "cost_update");
+	});
+});
+
+// ============================================================================
+// RpcClient Construction Tests
+// ============================================================================
+
+describe("RpcClient construction", () => {
+	it("creates with default options", () => {
+		const client = new RpcClient();
+		assert.ok(client);
+	});
+
+	it("creates with custom options", () => {
+		const client = new RpcClient({
+			cliPath: "/usr/local/bin/gsd",
+			cwd: "/tmp",
+			env: { NODE_ENV: "test" },
+			provider: "anthropic",
+			model: "claude-sonnet",
+			args: ["--verbose"],
+		});
+		assert.ok(client);
+	});
+});
+
+// ============================================================================
+// events() Generator Tests
+// ============================================================================
+
+describe("events() async generator", () => {
+	it("yields events from a mock stream in order", async () => {
+		const client = new RpcClient();
+
+		// Reach into the client to set up a mock process with a PassThrough stdout
+		const mockStdout = new PassThrough();
+		const mockStderr = new PassThrough();
+		const mockStdin = new PassThrough();
+
+		// Simulate a started process by setting internal state
+		// We use Object.assign to set private fields for testing
+		const clientAny = client as any;
+		clientAny.process = {
+			stdout: mockStdout,
+			stderr: mockStderr,
+			stdin: mockStdin,
+			exitCode: null,
+			kill: () => {},
+			on: (event: string, handler: (...args: any[]) => void) => {
+				if (event === "exit") {
+					// Store exit handler so we can trigger it
+					clientAny._testExitHandler = handler;
+				}
+			},
+			removeListener: () => {},
+		};
+
+		// Attach the JSONL reader like start() does
+		clientAny.stopReadingStdout = attachJsonlLineReader(mockStdout, (line: string) => {
+			clientAny.handleLine(line);
+		});
+
+		// Collect events from the generator
+		const received: SdkAgentEvent[] = [];
+		const genPromise = (async () => {
+			for await (const event of client.events()) {
+				received.push(event);
+				if (event.type === "done") break;
+			}
+		})();
+
+		// Simulate server sending events
+		await new Promise((r) => setTimeout(r, 20));
+		mockStdout.write(serializeJsonLine({ type: "agent_start", runId: "r1" }));
+		await new Promise((r) => setTimeout(r, 20));
+		mockStdout.write(serializeJsonLine({ type: "token", text: "hello" }));
+		await new Promise((r) => setTimeout(r, 20));
+		mockStdout.write(serializeJsonLine({ type: "done" }));
+
+		await genPromise;
+
+		assert.equal(received.length, 3);
+		assert.equal(received[0].type, "agent_start");
+		assert.equal(received[1].type, "token");
+		assert.equal(received[2].type, "done");
+	});
+
+	it("terminates when process exits", async () => {
+		const client = new RpcClient();
+		const mockStdout = new PassThrough();
+		const mockStderr = new PassThrough();
+		const mockStdin = new PassThrough();
+
+		const exitHandlers: Array<() => void> = [];
+		const clientAny = client as any;
+		clientAny.process = {
+			stdout: mockStdout,
+			stderr: mockStderr,
+			stdin: mockStdin,
+			exitCode: null,
+			kill: () => {},
+			on: (event: string, handler: () => void) => {
+				if (event === "exit") exitHandlers.push(handler);
+			},
+			removeListener: (event: string, handler: () => void) => {
+				const idx = exitHandlers.indexOf(handler);
+				if (idx !== -1) exitHandlers.splice(idx, 1);
+			},
+		};
+
+		clientAny.stopReadingStdout = attachJsonlLineReader(mockStdout, (line: string) => {
+			clientAny.handleLine(line);
+		});
+
+		const received: SdkAgentEvent[] = [];
+		const genPromise = (async () => {
+			for await (const event of client.events()) {
+				received.push(event);
+			}
+		})();
+
+		// Send one event, then simulate process exit
+		await new Promise((r) => setTimeout(r, 20));
+		mockStdout.write(serializeJsonLine({ type: "agent_start" }));
+		await new Promise((r) => setTimeout(r, 20));
+
+		// Fire exit handlers
+		for (const h of exitHandlers) h();
+
+		await genPromise;
+
+		assert.equal(received.length, 1);
+		assert.equal(received[0].type, "agent_start");
+	});
+
+	it("throws if client not started", async () => {
+		const client = new RpcClient();
+		await assert.rejects(async () => {
+			// eslint-disable-next-line @typescript-eslint/no-unused-vars
+			for await (const _event of client.events()) {
+				// should not reach
+			}
+		}, /Client not started/);
+	});
+});
+
+// ============================================================================
+// sendUIResponse Serialization Test
+// ============================================================================
+
+describe("sendUIResponse serialization", () => {
+	it("writes correct JSONL to stdin", () => {
+		const client = new RpcClient();
+		const chunks: string[] = [];
+		const mockStdin = {
+			write: (data: string) => {
+				chunks.push(data);
+				return true;
+			},
+		};
+
+		const clientAny = client as any;
+		clientAny.process = { stdin: mockStdin };
+
+		client.sendUIResponse("ui_1", { value: "hello" });
+
+		assert.equal(chunks.length, 1);
+		const parsed = JSON.parse(chunks[0].trim());
+		assert.equal(parsed.type, "extension_ui_response");
+		assert.equal(parsed.id, "ui_1");
+		assert.equal(parsed.value, "hello");
+	});
+
+	it("serializes confirmed response", () => {
+		const client = new RpcClient();
+		const chunks: string[] = [];
+		const mockStdin = {
+			write: (data: string) => {
+				chunks.push(data);
+				return true;
+			},
+		};
+		const clientAny = client as any;
+		clientAny.process = { stdin: mockStdin };
+
+		client.sendUIResponse("ui_2", { confirmed: true });
+
+		const parsed = JSON.parse(chunks[0].trim());
+		assert.equal(parsed.confirmed, true);
+		assert.equal(parsed.id, "ui_2");
+	});
+
+	it("serializes cancelled response", () => {
+		const client = new RpcClient();
+		const chunks: string[] = [];
+		const mockStdin = {
+			write: (data: string) => {
+				chunks.push(data);
+				return true;
+			},
+		};
+		const clientAny = client as any;
+		clientAny.process = { stdin: mockStdin };
+
+		client.sendUIResponse("ui_3", { cancelled: true });
+
+		const parsed = JSON.parse(chunks[0].trim());
+		assert.equal(parsed.cancelled, true);
+	});
+});
+
+// ============================================================================
+// init/shutdown/subscribe Serialization Tests
+// ============================================================================
+
+describe("v2 command serialization", () => {
+	// Helper: capture what the client sends to stdin
+	function createMockClient(): { client: RpcClient; sent: any[]; respondNext: (data?: any) => void } {
+		const client = new RpcClient();
+		const sent: any[] = [];
+		let respondFn: ((data: any) => void) | null = null;
+
+		const clientAny = client as any;
+		clientAny.process = {
+			stdin: {
+				write: (data: string) => {
+					const parsed = JSON.parse(data.trim());
+					sent.push(parsed);
+					// Auto-respond with success after a tick
+					if (respondFn) {
+						setTimeout(() => respondFn!(parsed), 5);
+					}
+					return true;
+				},
+			},
+			stderr: new PassThrough(),
+			exitCode: null,
+			kill: () => {},
+			on: () => {},
+			removeListener: () => {},
+		};
+
+		const respondNext = (overrides: any = {}) => {
+			respondFn = (parsed) => {
+				const response = {
+					type: "response",
+					id: parsed.id,
+					command: parsed.type,
+					success: true,
+					data: {},
+					...overrides,
+				};
+				clientAny.handleLine(JSON.stringify(response));
+			};
+		};
+
+		return { client, sent, respondNext };
+	}
+
+	it("init sends correct v2 init command", async () => {
+		const { client, sent, respondNext } = createMockClient();
+		respondNext({ data: { protocolVersion: 2, sessionId: "s1", capabilities: { events: [], commands: [] } } });
+
+		const result = await client.init({ clientId: "test-app" });
+
+		assert.equal(sent.length, 1);
+		assert.equal(sent[0].type, "init");
+		assert.equal(sent[0].protocolVersion, 2);
+		assert.equal(sent[0].clientId, "test-app");
+		assert.equal(result.protocolVersion, 2);
+		assert.equal(result.sessionId, "s1");
+	});
+
+	it("shutdown sends shutdown command", async () => {
+		const { client, sent, respondNext } = createMockClient();
+
+		// Override the process exit wait
+		const clientAny = client as any;
+		const originalProcess = clientAny.process;
+		const exitHandlers: Array<(code: number) => void> = [];
+		clientAny.process = {
+			...originalProcess,
+			on: (event: string, handler: (code: number) => void) => {
+				if (event === "exit") exitHandlers.push(handler);
+			},
+		};
+
+		respondNext();
+
+		// Call shutdown and simulate process exit
+		const shutdownPromise = client.shutdown();
+		await new Promise((r) => setTimeout(r, 20));
+		for (const h of exitHandlers) h(0);
+
+		await shutdownPromise;
+
+		assert.equal(sent.length, 1);
+		assert.equal(sent[0].type, "shutdown");
+	});
+
+	it("subscribe sends subscribe command with event list", async () => {
+		const { client, sent, respondNext } = createMockClient();
+		respondNext();
+
+		await client.subscribe(["execution_complete", "cost_update"]);
+
+		assert.equal(sent.length, 1);
+		assert.equal(sent[0].type, "subscribe");
+		assert.deepEqual(sent[0].events, ["execution_complete", "cost_update"]);
+	});
+
+	it("subscribe with wildcard", async () => {
+		const { client, sent, respondNext } = createMockClient();
+		respondNext();
+
+		await client.subscribe(["*"]);
+
+		assert.equal(sent[0].events.length, 1);
+		assert.equal(sent[0].events[0], "*");
+	});
+});
--- a/packages/rpc-client/src/rpc-client.ts
+++ b/packages/rpc-client/src/rpc-client.ts
@ -0,0 +1,666 @@
+/**
+ * RPC Client for programmatic access to the coding agent.
+ *
+ * Spawns the agent in RPC mode and provides a typed API for all operations.
+ * This is a standalone SDK client — all types are inlined with zero internal
+ * package dependencies.
+ */
+
+import { type ChildProcess, spawn } from "node:child_process";
+import { attachJsonlLineReader, serializeJsonLine } from "./jsonl.js";
+import type {
+	BashResult,
+	CompactionResult,
+	ImageContent,
+	ModelInfo,
+	RpcCommand,
+	RpcInitResult,
+	RpcResponse,
+	RpcSessionState,
+	RpcSlashCommand,
+	ThinkingLevel,
+	SessionStats,
+} from "./rpc-types.js";
+
+// ============================================================================
+// Types
+// ============================================================================
+
+/** Distributive Omit that works with union types */
+type DistributiveOmit<T, K extends keyof T> = T extends unknown ? Omit<T, K> : never;
+
+/** RpcCommand without the id field (for internal send) */
+type RpcCommandBody = DistributiveOmit<RpcCommand, "id">;
+
+/** Agent event — a loosely-typed record from the server. The `type` field is always present. */
+export interface SdkAgentEvent {
+	type: string;
+	[key: string]: unknown;
+}
+
+export interface RpcClientOptions {
+	/** Path to the CLI entry point (default: searches for dist/cli.js) */
+	cliPath?: string;
+	/** Working directory for the agent */
+	cwd?: string;
+	/** Environment variables */
+	env?: Record<string, string>;
+	/** Provider to use */
+	provider?: string;
+	/** Model ID to use */
+	model?: string;
+	/** Additional CLI arguments */
+	args?: string[];
+}
+
+export type RpcEventListener = (event: SdkAgentEvent) => void;
+
+// ============================================================================
+// RPC Client
+// ============================================================================
+
+export class RpcClient {
+	private process: ChildProcess | null = null;
+	private stopReadingStdout: (() => void) | null = null;
+	private _stderrHandler?: (data: Buffer) => void;
+	private eventListeners: RpcEventListener[] = [];
+	private pendingRequests: Map<string, { resolve: (response: RpcResponse) => void; reject: (error: Error) => void }> =
+		new Map();
+	private requestId = 0;
+	private stderr = "";
+	private _stopped = false;
+
+	constructor(private options: RpcClientOptions = {}) {}
+
+	/**
+	 * Start the RPC agent process.
+	 */
+	async start(): Promise<void> {
+		if (this.process) {
+			throw new Error("Client already started");
+		}
+
+		this._stopped = false;
+
+		const cliPath = this.options.cliPath ?? "dist/cli.js";
+		const args = ["--mode", "rpc"];
+
+		if (this.options.provider) {
+			args.push("--provider", this.options.provider);
+		}
+		if (this.options.model) {
+			args.push("--model", this.options.model);
+		}
+		if (this.options.args) {
+			args.push(...this.options.args);
+		}
+
+		this.process = spawn("node", [cliPath, ...args], {
+			cwd: this.options.cwd,
+			env: { ...process.env, ...this.options.env },
+			stdio: ["pipe", "pipe", "pipe"],
+		});
+
+		// Collect stderr for debugging
+		this._stderrHandler = (data: Buffer) => {
+			this.stderr += data.toString();
+		};
+		this.process.stderr?.on("data", this._stderrHandler);
+
+		// Set up strict JSONL reader for stdout.
+		this.stopReadingStdout = attachJsonlLineReader(this.process.stdout!, (line) => {
+			this.handleLine(line);
+		});
+
+		// Detect unexpected subprocess exit and reject all pending requests
+		this.process.on("exit", (code, signal) => {
+			if (this.pendingRequests.size > 0) {
+				const reason = signal ? `signal ${signal}` : `code ${code}`;
+				const error = new Error(`Agent process exited unexpectedly (${reason}). Stderr: ${this.stderr}`);
+				for (const [id, pending] of this.pendingRequests) {
+					this.pendingRequests.delete(id);
+					pending.reject(error);
+				}
+			}
+		});
+
+		// Wait a moment for process to initialize
+		await new Promise((resolve) => setTimeout(resolve, 100));
+
+		if (this.process.exitCode !== null) {
+			throw new Error(`Agent process exited immediately with code ${this.process.exitCode}. Stderr: ${this.stderr}`);
+		}
+	}
+
+	/**
+	 * Stop the RPC agent process.
+	 */
+	async stop(): Promise<void> {
+		if (!this.process) return;
+
+		this._stopped = true;
+
+		this.stopReadingStdout?.();
+		this.stopReadingStdout = null;
+		if (this._stderrHandler) {
+			this.process.stderr?.removeListener("data", this._stderrHandler);
+			this._stderrHandler = undefined;
+		}
+		this.process.kill("SIGTERM");
+
+		// Wait for process to exit
+		await new Promise<void>((resolve) => {
+			const timeout = setTimeout(() => {
+				this.process?.kill("SIGKILL");
+				resolve();
+			}, 1000);
+
+			this.process?.on("exit", () => {
+				clearTimeout(timeout);
+				resolve();
+			});
+		});
+
+		this.process = null;
+		this.pendingRequests.clear();
+	}
+
+	/**
+	 * Subscribe to agent events via callback.
+	 */
+	onEvent(listener: RpcEventListener): () => void {
+		this.eventListeners.push(listener);
+		return () => {
+			const index = this.eventListeners.indexOf(listener);
+			if (index !== -1) {
+				this.eventListeners.splice(index, 1);
+			}
+		};
+	}
+
+	/**
+	 * Async generator that yields agent events as they arrive.
+	 *
+	 * Usage:
+	 * ```ts
+	 * for await (const event of client.events()) {
+	 *   console.log(event.type, event);
+	 * }
+	 * ```
+	 *
+	 * The generator terminates when:
+	 * - `stop()` is called
+	 * - The agent process exits
+	 * - The consumer breaks out of the loop
+	 */
+	async *events(): AsyncGenerator<SdkAgentEvent, void, undefined> {
+		if (!this.process) {
+			throw new Error("Client not started — call start() before events()");
+		}
+
+		if (this._stopped) {
+			return;
+		}
+
+		const buffer: SdkAgentEvent[] = [];
+		let resolve: ((value: void) => void) | null = null;
+		let done = false;
+
+		// When a new event arrives, either push to buffer or wake up the awaiting generator
+		const listener = (event: SdkAgentEvent) => {
+			buffer.push(event);
+			if (resolve) {
+				const r = resolve;
+				resolve = null;
+				r();
+			}
+		};
+
+		// When the process exits, signal the generator to stop
+		const onExit = () => {
+			done = true;
+			if (resolve) {
+				const r = resolve;
+				resolve = null;
+				r();
+			}
+		};
+
+		const unsubscribe = this.onEvent(listener);
+		this.process.on("exit", onExit);
+
+		try {
+			while (!done && !this._stopped) {
+				// Drain buffer first
+				while (buffer.length > 0) {
+					yield buffer.shift()!;
+				}
+
+				// If done after draining, break
+				if (done || this._stopped) {
+					break;
+				}
+
+				// Wait for next event or process exit
+				await new Promise<void>((r) => {
+					resolve = r;
+				});
+			}
+
+			// Drain any remaining events that arrived with the exit signal
+			while (buffer.length > 0) {
+				yield buffer.shift()!;
+			}
+		} finally {
+			unsubscribe();
+			this.process?.removeListener("exit", onExit);
+		}
+	}
+
+	/**
+	 * Get collected stderr output (useful for debugging).
+	 */
+	getStderr(): string {
+		return this.stderr;
+	}
+
+	// =========================================================================
+	// Command Methods
+	// =========================================================================
+
+	/**
+	 * Send a prompt to the agent.
+	 * Returns immediately after sending; use onEvent() or events() to receive streaming events.
+	 * Use waitForIdle() to wait for completion.
+	 */
+	async prompt(message: string, images?: ImageContent[]): Promise<void> {
+		await this.send({ type: "prompt", message, images });
+	}
+
+	/**
+	 * Queue a steering message to interrupt the agent mid-run.
+	 */
+	async steer(message: string, images?: ImageContent[]): Promise<void> {
+		await this.send({ type: "steer", message, images });
+	}
+
+	/**
+	 * Queue a follow-up message to be processed after the agent finishes.
+	 */
+	async followUp(message: string, images?: ImageContent[]): Promise<void> {
+		await this.send({ type: "follow_up", message, images });
+	}
+
+	/**
+	 * Abort current operation.
+	 */
+	async abort(): Promise<void> {
+		await this.send({ type: "abort" });
+	}
+
+	/**
+	 * Start a new session, optionally with parent tracking.
+	 * @param parentSession - Optional parent session path for lineage tracking
+	 * @returns Object with `cancelled: true` if an extension cancelled the new session
+	 */
+	async newSession(parentSession?: string): Promise<{ cancelled: boolean }> {
+		const response = await this.send({ type: "new_session", parentSession });
+		return this.getData(response);
+	}
+
+	/**
+	 * Get current session state.
+	 */
+	async getState(): Promise<RpcSessionState> {
+		const response = await this.send({ type: "get_state" });
+		return this.getData(response);
+	}
+
+	/**
+	 * Set model by provider and ID.
+	 */
+	async setModel(provider: string, modelId: string): Promise<{ provider: string; id: string }> {
+		const response = await this.send({ type: "set_model", provider, modelId });
+		return this.getData(response);
+	}
+
+	/**
+	 * Cycle to next model.
+	 */
+	async cycleModel(): Promise<{
+		model: { provider: string; id: string };
+		thinkingLevel: ThinkingLevel;
+		isScoped: boolean;
+	} | null> {
+		const response = await this.send({ type: "cycle_model" });
+		return this.getData(response);
+	}
+
+	/**
+	 * Get list of available models.
+	 */
+	async getAvailableModels(): Promise<ModelInfo[]> {
+		const response = await this.send({ type: "get_available_models" });
+		return this.getData<{ models: ModelInfo[] }>(response).models;
+	}
+
+	/**
+	 * Set thinking level.
+	 */
+	async setThinkingLevel(level: ThinkingLevel): Promise<void> {
+		await this.send({ type: "set_thinking_level", level });
+	}
+
+	/**
+	 * Cycle thinking level.
+	 */
+	async cycleThinkingLevel(): Promise<{ level: ThinkingLevel } | null> {
+		const response = await this.send({ type: "cycle_thinking_level" });
+		return this.getData(response);
+	}
+
+	/**
+	 * Set steering mode.
+	 */
+	async setSteeringMode(mode: "all" | "one-at-a-time"): Promise<void> {
+		await this.send({ type: "set_steering_mode", mode });
+	}
+
+	/**
+	 * Set follow-up mode.
+	 */
+	async setFollowUpMode(mode: "all" | "one-at-a-time"): Promise<void> {
+		await this.send({ type: "set_follow_up_mode", mode });
+	}
+
+	/**
+	 * Compact session context.
+	 */
+	async compact(customInstructions?: string): Promise<CompactionResult> {
+		const response = await this.send({ type: "compact", customInstructions });
+		return this.getData(response);
+	}
+
+	/**
+	 * Set auto-compaction enabled/disabled.
+	 */
+	async setAutoCompaction(enabled: boolean): Promise<void> {
+		await this.send({ type: "set_auto_compaction", enabled });
+	}
+
+	/**
+	 * Set auto-retry enabled/disabled.
+	 */
+	async setAutoRetry(enabled: boolean): Promise<void> {
+		await this.send({ type: "set_auto_retry", enabled });
+	}
+
+	/**
+	 * Abort in-progress retry.
+	 */
+	async abortRetry(): Promise<void> {
+		await this.send({ type: "abort_retry" });
+	}
+
+	/**
+	 * Execute a bash command.
+	 */
+	async bash(command: string): Promise<BashResult> {
+		const response = await this.send({ type: "bash", command });
+		return this.getData(response);
+	}
+
+	/**
+	 * Abort running bash command.
+	 */
+	async abortBash(): Promise<void> {
+		await this.send({ type: "abort_bash" });
+	}
+
+	/**
+	 * Get session statistics.
+	 */
+	async getSessionStats(): Promise<SessionStats> {
+		const response = await this.send({ type: "get_session_stats" });
+		return this.getData(response);
+	}
+
+	/**
+	 * Export session to HTML.
+	 */
+	async exportHtml(outputPath?: string): Promise<{ path: string }> {
+		const response = await this.send({ type: "export_html", outputPath });
+		return this.getData(response);
+	}
+
+	/**
+	 * Switch to a different session file.
+	 * @returns Object with `cancelled: true` if an extension cancelled the switch
+	 */
+	async switchSession(sessionPath: string): Promise<{ cancelled: boolean }> {
+		const response = await this.send({ type: "switch_session", sessionPath });
+		return this.getData(response);
+	}
+
+	/**
+	 * Fork from a specific message.
+	 * @returns Object with `text` (the message text) and `cancelled` (if extension cancelled)
+	 */
+	async fork(entryId: string): Promise<{ text: string; cancelled: boolean }> {
+		const response = await this.send({ type: "fork", entryId });
+		return this.getData(response);
+	}
+
+	/**
+	 * Get messages available for forking.
+	 */
+	async getForkMessages(): Promise<Array<{ entryId: string; text: string }>> {
+		const response = await this.send({ type: "get_fork_messages" });
+		return this.getData<{ messages: Array<{ entryId: string; text: string }> }>(response).messages;
+	}
+
+	/**
+	 * Get text of last assistant message.
+	 */
+	async getLastAssistantText(): Promise<string | null> {
+		const response = await this.send({ type: "get_last_assistant_text" });
+		return this.getData<{ text: string | null }>(response).text;
+	}
+
+	/**
+	 * Set the session display name.
+	 */
+	async setSessionName(name: string): Promise<void> {
+		await this.send({ type: "set_session_name", name });
+	}
+
+	/**
+	 * Get all messages in the session.
+	 * Messages are returned as opaque objects — the internal structure may vary.
+	 */
+	async getMessages(): Promise<unknown[]> {
+		const response = await this.send({ type: "get_messages" });
+		return this.getData<{ messages: unknown[] }>(response).messages;
+	}
+
+	/**
+	 * Get available commands (extension commands, prompt templates, skills).
+	 */
+	async getCommands(): Promise<RpcSlashCommand[]> {
+		const response = await this.send({ type: "get_commands" });
+		return this.getData<{ commands: RpcSlashCommand[] }>(response).commands;
+	}
+
+	/**
+	 * Send a UI response to a pending extension_ui_request.
+	 * Fire-and-forget — no request/response correlation.
+	 */
+	sendUIResponse(id: string, response: { value?: string; values?: string[]; confirmed?: boolean; cancelled?: boolean }): void {
+		if (!this.process?.stdin) {
+			throw new Error("Client not started");
+		}
+		this.process.stdin.write(serializeJsonLine({
+			type: "extension_ui_response",
+			id,
+			...response,
+		}));
+	}
+
+	/**
+	 * Initialize a v2 protocol session. Must be sent as the first command.
+	 * Returns the negotiated protocol version, session ID, and server capabilities.
+	 */
+	async init(options?: { clientId?: string }): Promise<RpcInitResult> {
+		const response = await this.send({ type: "init", protocolVersion: 2, clientId: options?.clientId });
+		return this.getData<RpcInitResult>(response);
+	}
+
+	/**
+	 * Request a graceful shutdown of the agent process.
+	 * Waits for the response before the process exits.
+	 */
+	async shutdown(): Promise<void> {
+		await this.send({ type: "shutdown" });
+		// Wait for process to exit after shutdown acknowledgment
+		if (this.process) {
+			await new Promise<void>((resolve) => {
+				const timeout = setTimeout(() => {
+					this.process?.kill("SIGKILL");
+					resolve();
+				}, 5000);
+				this.process?.on("exit", () => {
+					clearTimeout(timeout);
+					resolve();
+				});
+			});
+		}
+	}
+
+	/**
+	 * Subscribe to specific event types (v2 only).
+	 * Pass ["*"] to receive all events, or a list of event type strings to filter.
+	 */
+	async subscribe(events: string[]): Promise<void> {
+		await this.send({ type: "subscribe", events });
+	}
+
+	// =========================================================================
+	// Helpers
+	// =========================================================================
+
+	/**
+	 * Wait for agent to become idle (no streaming).
+	 * Resolves when agent_end event is received.
+	 */
+	waitForIdle(timeout = 60000): Promise<void> {
+		return new Promise((resolve, reject) => {
+			const timer = setTimeout(() => {
+				unsubscribe();
+				reject(new Error(`Timeout waiting for agent to become idle. Stderr: ${this.stderr}`));
+			}, timeout);
+
+			const unsubscribe = this.onEvent((event) => {
+				if (event.type === "agent_end") {
+					clearTimeout(timer);
+					unsubscribe();
+					resolve();
+				}
+			});
+		});
+	}
+
+	/**
+	 * Collect events until agent becomes idle.
+	 */
+	collectEvents(timeout = 60000): Promise<SdkAgentEvent[]> {
+		return new Promise((resolve, reject) => {
+			const events: SdkAgentEvent[] = [];
+			const timer = setTimeout(() => {
+				unsubscribe();
+				reject(new Error(`Timeout collecting events. Stderr: ${this.stderr}`));
+			}, timeout);
+
+			const unsubscribe = this.onEvent((event) => {
+				events.push(event);
+				if (event.type === "agent_end") {
+					clearTimeout(timer);
+					unsubscribe();
+					resolve(events);
+				}
+			});
+		});
+	}
+
+	/**
+	 * Send prompt and wait for completion, returning all events.
+	 */
+	async promptAndWait(message: string, images?: ImageContent[], timeout = 60000): Promise<SdkAgentEvent[]> {
+		const eventsPromise = this.collectEvents(timeout);
+		await this.prompt(message, images);
+		return eventsPromise;
+	}
+
+	// =========================================================================
+	// Internal
+	// =========================================================================
+
+	private handleLine(line: string): void {
+		try {
+			const data = JSON.parse(line);
+
+			// Check if it's a response to a pending request
+			if (data.type === "response" && data.id && this.pendingRequests.has(data.id)) {
+				const pending = this.pendingRequests.get(data.id)!;
+				this.pendingRequests.delete(data.id);
+				pending.resolve(data as RpcResponse);
+				return;
+			}
+
+			// Otherwise it's an event — dispatch to listeners
+			for (const listener of this.eventListeners) {
+				listener(data as SdkAgentEvent);
+			}
+		} catch {
+			// Ignore non-JSON lines
+		}
+	}
+
+	private async send(command: RpcCommandBody): Promise<RpcResponse> {
+		if (!this.process?.stdin) {
+			throw new Error("Client not started");
+		}
+
+		const id = `req_${++this.requestId}`;
+		const fullCommand = { ...command, id } as RpcCommand;
+
+		return new Promise((resolve, reject) => {
+			const timeout = setTimeout(() => {
+				this.pendingRequests.delete(id);
+				reject(new Error(`Timeout waiting for response to ${command.type}. Stderr: ${this.stderr}`));
+			}, 30000);
+
+			this.pendingRequests.set(id, {
+				resolve: (response) => {
+					clearTimeout(timeout);
+					resolve(response);
+				},
+				reject: (error) => {
+					clearTimeout(timeout);
+					reject(error);
+				},
+			});
+
+			this.process!.stdin!.write(serializeJsonLine(fullCommand));
+		});
+	}
+
+	private getData<T>(response: RpcResponse): T {
+		if (!response.success) {
+			const errorResponse = response as Extract<RpcResponse, { success: false }>;
+			throw new Error(errorResponse.error);
+		}
+		// Type assertion: we trust response.data matches T based on the command sent.
+		const successResponse = response as Extract<RpcResponse, { success: true; data: unknown }>;
+		return successResponse.data as T;
+	}
+}
--- a/packages/rpc-client/src/rpc-types.ts
+++ b/packages/rpc-client/src/rpc-types.ts
@ -0,0 +1,399 @@
+/**
+ * RPC protocol types for headless operation.
+ *
+ * Commands are sent as JSON lines on stdin.
+ * Responses and events are emitted as JSON lines on stdout.
+ *
+ * This file is self-contained — all types that were previously imported from
+ * internal packages are inlined so that this package has zero internal
+ * dependencies.
+ */
+
+// ============================================================================
+// Inlined types (originally from internal packages)
+// ============================================================================
+
+/** Thinking budget level (inlined from agent-core) */
+export type ThinkingLevel = "off" | "minimal" | "low" | "medium" | "high" | "xhigh";
+
+/** Image attachment (inlined from pi-ai) */
+export interface ImageContent {
+	type: "image";
+	data: string; // base64 encoded image data
+	mimeType: string; // e.g., "image/jpeg", "image/png"
+}
+
+/** Model descriptor — opaque for SDK consumers */
+export interface ModelInfo {
+	provider: string;
+	id: string;
+	contextWindow?: number;
+	reasoning?: boolean;
+	[key: string]: unknown;
+}
+
+/** Session statistics (from agent-session.ts) */
+export interface SessionStats {
+	sessionFile: string | undefined;
+	sessionId: string;
+	userMessages: number;
+	assistantMessages: number;
+	toolCalls: number;
+	toolResults: number;
+	totalMessages: number;
+	tokens: {
+		input: number;
+		output: number;
+		cacheRead: number;
+		cacheWrite: number;
+		total: number;
+	};
+	cost: number;
+}
+
+/** Bash command result (from bash-executor.ts) */
+export interface BashResult {
+	/** Combined stdout + stderr output (sanitized, possibly truncated) */
+	output: string;
+	/** Process exit code (undefined if killed/cancelled) */
+	exitCode: number | undefined;
+	/** Whether the command was cancelled via signal */
+	cancelled: boolean;
+	/** Whether the output was truncated */
+	truncated: boolean;
+	/** Path to temp file containing full output (if output exceeded truncation threshold) */
+	fullOutputPath?: string;
+}
+
+/** Compaction result (from compaction.ts) */
+export interface CompactionResult<T = unknown> {
+	summary: string;
+	firstKeptEntryId: string;
+	tokensBefore: number;
+	/** Extension-specific data (e.g., ArtifactIndex, version markers for structured compaction) */
+	details?: T;
+}
+
+// ============================================================================
+// RPC Protocol Versioning
+// ============================================================================
+
+/** Supported protocol versions. v1 is the implicit default; v2 requires an init handshake. */
+export type RpcProtocolVersion = 1 | 2;
+
+// ============================================================================
+// RPC Commands (stdin)
+// ============================================================================
+
+export type RpcCommand =
+	// Prompting
+	| { id?: string; type: "prompt"; message: string; images?: ImageContent[]; streamingBehavior?: "steer" | "followUp" }
+	| { id?: string; type: "steer"; message: string; images?: ImageContent[] }
+	| { id?: string; type: "follow_up"; message: string; images?: ImageContent[] }
+	| { id?: string; type: "abort" }
+	| { id?: string; type: "new_session"; parentSession?: string }
+
+	// State
+	| { id?: string; type: "get_state" }
+
+	// Model
+	| { id?: string; type: "set_model"; provider: string; modelId: string }
+	| { id?: string; type: "cycle_model" }
+	| { id?: string; type: "get_available_models" }
+
+	// Thinking
+	| { id?: string; type: "set_thinking_level"; level: ThinkingLevel }
+	| { id?: string; type: "cycle_thinking_level" }
+
+	// Queue modes
+	| { id?: string; type: "set_steering_mode"; mode: "all" | "one-at-a-time" }
+	| { id?: string; type: "set_follow_up_mode"; mode: "all" | "one-at-a-time" }
+
+	// Compaction
+	| { id?: string; type: "compact"; customInstructions?: string }
+	| { id?: string; type: "set_auto_compaction"; enabled: boolean }
+
+	// Retry
+	| { id?: string; type: "set_auto_retry"; enabled: boolean }
+	| { id?: string; type: "abort_retry" }
+
+	// Bash
+	| { id?: string; type: "bash"; command: string }
+	| { id?: string; type: "abort_bash" }
+
+	// Session
+	| { id?: string; type: "get_session_stats" }
+	| { id?: string; type: "export_html"; outputPath?: string }
+	| { id?: string; type: "switch_session"; sessionPath: string }
+	| { id?: string; type: "fork"; entryId: string }
+	| { id?: string; type: "get_fork_messages" }
+	| { id?: string; type: "get_last_assistant_text" }
+	| { id?: string; type: "set_session_name"; name: string }
+
+	// Messages
+	| { id?: string; type: "get_messages" }
+
+	// Commands (available for invocation via prompt)
+	| { id?: string; type: "get_commands" }
+
+	// Bridge-hosted native terminal
+	| { id?: string; type: "terminal_input"; data: string }
+	| { id?: string; type: "terminal_resize"; cols: number; rows: number }
+	| { id?: string; type: "terminal_redraw" }
+
+	// v2 Protocol
+	| { id?: string; type: "init"; protocolVersion: 2; clientId?: string }
+	| { id?: string; type: "shutdown"; graceful?: boolean }
+	| { id?: string; type: "subscribe"; events: string[] };
+
+// ============================================================================
+// RPC Slash Command (for get_commands response)
+// ============================================================================
+
+/** A command available for invocation via prompt */
+export interface RpcSlashCommand {
+	/** Command name (without leading slash) */
+	name: string;
+	/** Human-readable description */
+	description?: string;
+	/** What kind of command this is */
+	source: "extension" | "prompt" | "skill";
+	/** Where the command was loaded from (undefined for extensions) */
+	location?: "user" | "project" | "path";
+	/** File path to the command source */
+	path?: string;
+}
+
+// ============================================================================
+// RPC State
+// ============================================================================
+
+export interface RpcSessionState {
+	model?: ModelInfo;
+	thinkingLevel: ThinkingLevel;
+	isStreaming: boolean;
+	isCompacting: boolean;
+	steeringMode: "all" | "one-at-a-time";
+	followUpMode: "all" | "one-at-a-time";
+	sessionFile?: string;
+	sessionId: string;
+	sessionName?: string;
+	autoCompactionEnabled: boolean;
+	autoRetryEnabled: boolean;
+	retryInProgress: boolean;
+	retryAttempt: number;
+	messageCount: number;
+	pendingMessageCount: number;
+	/** Whether extension loading has completed. Commands from `get_commands` may be incomplete until true. */
+	extensionsReady: boolean;
+}
+
+// ============================================================================
+// RPC Responses (stdout)
+// ============================================================================
+
+// Success responses with data
+export type RpcResponse =
+	// Prompting (async - events follow)
+	| { id?: string; type: "response"; command: "prompt"; success: true; runId?: string }
+	| { id?: string; type: "response"; command: "steer"; success: true; runId?: string }
+	| { id?: string; type: "response"; command: "follow_up"; success: true; runId?: string }
+	| { id?: string; type: "response"; command: "abort"; success: true }
+	| { id?: string; type: "response"; command: "new_session"; success: true; data: { cancelled: boolean } }
+
+	// State
+	| { id?: string; type: "response"; command: "get_state"; success: true; data: RpcSessionState }
+
+	// Model
+	| {
+			id?: string;
+			type: "response";
+			command: "set_model";
+			success: true;
+			data: ModelInfo;
+	  }
+	| {
+			id?: string;
+			type: "response";
+			command: "cycle_model";
+			success: true;
+			data: { model: ModelInfo; thinkingLevel: ThinkingLevel; isScoped: boolean } | null;
+	  }
+	| {
+			id?: string;
+			type: "response";
+			command: "get_available_models";
+			success: true;
+			data: { models: ModelInfo[] };
+	  }
+
+	// Thinking
+	| { id?: string; type: "response"; command: "set_thinking_level"; success: true }
+	| {
+			id?: string;
+			type: "response";
+			command: "cycle_thinking_level";
+			success: true;
+			data: { level: ThinkingLevel } | null;
+	  }
+
+	// Queue modes
+	| { id?: string; type: "response"; command: "set_steering_mode"; success: true }
+	| { id?: string; type: "response"; command: "set_follow_up_mode"; success: true }
+
+	// Compaction
+	| { id?: string; type: "response"; command: "compact"; success: true; data: CompactionResult }
+	| { id?: string; type: "response"; command: "set_auto_compaction"; success: true }
+
+	// Retry
+	| { id?: string; type: "response"; command: "set_auto_retry"; success: true }
+	| { id?: string; type: "response"; command: "abort_retry"; success: true }
+
+	// Bash
+	| { id?: string; type: "response"; command: "bash"; success: true; data: BashResult }
+	| { id?: string; type: "response"; command: "abort_bash"; success: true }
+
+	// Session
+	| { id?: string; type: "response"; command: "get_session_stats"; success: true; data: SessionStats }
+	| { id?: string; type: "response"; command: "export_html"; success: true; data: { path: string } }
+	| { id?: string; type: "response"; command: "switch_session"; success: true; data: { cancelled: boolean } }
+	| { id?: string; type: "response"; command: "fork"; success: true; data: { text: string; cancelled: boolean } }
+	| {
+			id?: string;
+			type: "response";
+			command: "get_fork_messages";
+			success: true;
+			data: { messages: Array<{ entryId: string; text: string }> };
+	  }
+	| {
+			id?: string;
+			type: "response";
+			command: "get_last_assistant_text";
+			success: true;
+			data: { text: string | null };
+	  }
+	| { id?: string; type: "response"; command: "set_session_name"; success: true }
+
+	// Messages — AgentMessage is opaque for SDK consumers
+	| { id?: string; type: "response"; command: "get_messages"; success: true; data: { messages: unknown[] } }
+
+	// Commands
+	| {
+			id?: string;
+			type: "response";
+			command: "get_commands";
+			success: true;
+			data: { commands: RpcSlashCommand[] };
+	  }
+
+	// Bridge-hosted native terminal
+	| { id?: string; type: "response"; command: "terminal_input"; success: true }
+	| { id?: string; type: "response"; command: "terminal_resize"; success: true }
+	| { id?: string; type: "response"; command: "terminal_redraw"; success: true }
+
+	// v2 Protocol
+	| { id?: string; type: "response"; command: "init"; success: true; data: RpcInitResult }
+	| { id?: string; type: "response"; command: "shutdown"; success: true }
+	| { id?: string; type: "response"; command: "subscribe"; success: true }
+
+	// Error response (any command can fail)
+	| { id?: string; type: "response"; command: string; success: false; error: string };
+
+// ============================================================================
+// v2 Protocol Types
+// ============================================================================
+
+/** Result of the init handshake (v2 only) */
+export interface RpcInitResult {
+	protocolVersion: 2;
+	sessionId: string;
+	capabilities: {
+		events: string[];
+		commands: string[];
+	};
+}
+
+/** v2 execution_complete event — emitted when a prompt/steer/follow_up finishes */
+export interface RpcExecutionCompleteEvent {
+	type: "execution_complete";
+	runId: string;
+	status: "completed" | "error" | "cancelled";
+	reason?: string;
+	stats: SessionStats;
+}
+
+/** v2 cost_update event — emitted per-turn with running cost data */
+export interface RpcCostUpdateEvent {
+	type: "cost_update";
+	runId: string;
+	turnCost: number;
+	cumulativeCost: number;
+	tokens: {
+		input: number;
+		output: number;
+		cacheRead: number;
+		cacheWrite: number;
+	};
+}
+
+/** Discriminated union of all v2-only event types */
+export type RpcV2Event = RpcExecutionCompleteEvent | RpcCostUpdateEvent;
+
+// ============================================================================
+// Extension UI Events (stdout)
+// ============================================================================
+
+/** Emitted when an extension needs user input */
+export type RpcExtensionUIRequest =
+	| { type: "extension_ui_request"; id: string; method: "select"; title: string; options: string[]; timeout?: number; allowMultiple?: boolean }
+	| { type: "extension_ui_request"; id: string; method: "confirm"; title: string; message: string; timeout?: number }
+	| {
+			type: "extension_ui_request";
+			id: string;
+			method: "input";
+			title: string;
+			placeholder?: string;
+			timeout?: number;
+	  }
+	| { type: "extension_ui_request"; id: string; method: "editor"; title: string; prefill?: string }
+	| {
+			type: "extension_ui_request";
+			id: string;
+			method: "notify";
+			message: string;
+			notifyType?: "info" | "warning" | "error";
+	  }
+	| {
+			type: "extension_ui_request";
+			id: string;
+			method: "setStatus";
+			statusKey: string;
+			statusText: string | undefined;
+	  }
+	| {
+			type: "extension_ui_request";
+			id: string;
+			method: "setWidget";
+			widgetKey: string;
+			widgetLines: string[] | undefined;
+			widgetPlacement?: "aboveEditor" | "belowEditor";
+	  }
+	| { type: "extension_ui_request"; id: string; method: "setTitle"; title: string }
+	| { type: "extension_ui_request"; id: string; method: "set_editor_text"; text: string };
+
+// ============================================================================
+// Extension UI Commands (stdin)
+// ============================================================================
+
+/** Response to an extension UI request */
+export type RpcExtensionUIResponse =
+	| { type: "extension_ui_response"; id: string; value: string }
+	| { type: "extension_ui_response"; id: string; values: string[] }
+	| { type: "extension_ui_response"; id: string; confirmed: boolean }
+	| { type: "extension_ui_response"; id: string; cancelled: true };
+
+// ============================================================================
+// Helper type for extracting command types
+// ============================================================================
+
+export type RpcCommandType = RpcCommand["type"];
--- a/packages/rpc-client/tsconfig.examples.json
+++ b/packages/rpc-client/tsconfig.examples.json
@ -0,0 +1,17 @@
+{
+  "compilerOptions": {
+    "target": "ES2024",
+    "module": "Node16",
+    "lib": ["ES2024"],
+    "strict": true,
+    "esModuleInterop": true,
+    "skipLibCheck": true,
+    "moduleResolution": "Node16",
+    "noEmit": true,
+    "types": ["node"],
+    "paths": {
+      "@gsd-build/rpc-client": ["./src/index.ts"]
+    }
+  },
+  "include": ["examples/**/*.ts"]
+}
--- a/packages/rpc-client/tsconfig.json
+++ b/packages/rpc-client/tsconfig.json
@ -0,0 +1,24 @@
+{
+  "compilerOptions": {
+    "target": "ES2024",
+    "module": "Node16",
+    "lib": ["ES2024"],
+    "strict": true,
+    "esModuleInterop": true,
+    "skipLibCheck": true,
+    "forceConsistentCasingInFileNames": true,
+    "declaration": true,
+    "declarationMap": true,
+    "sourceMap": true,
+    "inlineSources": true,
+    "inlineSourceMap": false,
+    "moduleResolution": "Node16",
+    "resolveJsonModule": true,
+    "allowImportingTsExtensions": false,
+    "types": ["node"],
+    "outDir": "./dist",
+    "rootDir": "./src"
+  },
+  "include": ["src/**/*.ts"],
+  "exclude": ["node_modules", "dist", "**/*.d.ts", "src/**/*.d.ts"]
+}
--- a/src/headless-ui.ts
+++ b/src/headless-ui.ts
@ -8,7 +8,7 @@

 import type { Readable } from 'node:stream'

-import { RpcClient, attachJsonlLineReader, serializeJsonLine } from '@gsd/pi-coding-agent'
+import { RpcClient, attachJsonlLineReader } from '@gsd/pi-coding-agent'

 // ---------------------------------------------------------------------------
 // Types
@ -34,10 +34,9 @@ export type { ExtensionUIRequest }

 export function handleExtensionUIRequest(
  event: ExtensionUIRequest,
-  writeToStdin: (data: string) => void,
+  client: RpcClient,
 ): void {
  const { id, method } = event
-  let response: Record<string, unknown>

  switch (method) {
    case 'select': {
@ -49,32 +48,30 @@ export function handleExtensionUIRequest(
        const forceOption = event.options.find(o => o.toLowerCase().includes('force start'))
        if (forceOption) selected = forceOption
      }
-      response = { type: 'extension_ui_response', id, value: selected }
+      client.sendUIResponse(id, { value: selected })
      break
    }
    case 'confirm':
-      response = { type: 'extension_ui_response', id, confirmed: true }
+      client.sendUIResponse(id, { confirmed: true })
      break
    case 'input':
-      response = { type: 'extension_ui_response', id, value: '' }
+      client.sendUIResponse(id, { value: '' })
      break
    case 'editor':
-      response = { type: 'extension_ui_response', id, value: event.prefill ?? '' }
+      client.sendUIResponse(id, { value: event.prefill ?? '' })
      break
    case 'notify':
    case 'setStatus':
    case 'setWidget':
    case 'setTitle':
    case 'set_editor_text':
-      response = { type: 'extension_ui_response', id, value: '' }
+      client.sendUIResponse(id, { value: '' })
      break
    default:
      process.stderr.write(`[headless] Warning: unknown extension_ui_request method "${method}", cancelling\n`)
-      response = { type: 'extension_ui_response', id, cancelled: true }
+      client.sendUIResponse(id, { cancelled: true })
      break
  }
-
-  writeToStdin(serializeJsonLine(response))
 }

 // ---------------------------------------------------------------------------
@ -114,7 +111,6 @@ export function formatProgress(event: Record<string, unknown>, verbose: boolean)
 // ---------------------------------------------------------------------------

 export function startSupervisedStdinReader(
-  stdinWriter: (data: string) => void,
  client: RpcClient,
  onResponse: (id: string) => void,
 ): () => void {
@ -130,12 +126,17 @@ export function startSupervisedStdinReader(
    const type = String(msg.type ?? '')

    switch (type) {
-      case 'extension_ui_response':
-        stdinWriter(line + '\n')
-        if (typeof msg.id === 'string') {
-          onResponse(msg.id)
+      case 'extension_ui_response': {
+        const id = String(msg.id ?? '')
+        const value = msg.value !== undefined ? String(msg.value) : undefined
+        const confirmed = typeof msg.confirmed === 'boolean' ? msg.confirmed : undefined
+        const cancelled = typeof msg.cancelled === 'boolean' ? msg.cancelled : undefined
+        client.sendUIResponse(id, { value, confirmed, cancelled })
+        if (id) {
+          onResponse(id)
        }
        break
+      }
      case 'prompt':
        client.prompt(String(msg.message ?? ''))
        break
--- a/src/headless.ts
+++ b/src/headless.ts
@ -17,7 +17,9 @@ import { join } from 'node:path'
 import { resolve } from 'node:path'
 import { ChildProcess } from 'node:child_process'

-import { RpcClient } from '@gsd/pi-coding-agent'
+import { RpcClient, SessionManager } from '@gsd/pi-coding-agent'
+import type { SessionInfo } from '@gsd/pi-coding-agent'
+import { getProjectSessionsDir } from './project-sessions.js'
 import { loadAndValidateAnswerFile, AnswerInjector } from './headless-answers.js'

 import {
@ -35,7 +37,7 @@ import {
  mapStatusToExitCode,
 } from './headless-events.js'

-import type { OutputFormat } from './headless-types.js'
+import type { OutputFormat, HeadlessJsonResult } from './headless-types.js'
 import { VALID_OUTPUT_FORMATS } from './headless-types.js'

 import {
@ -80,6 +82,39 @@ interface TrackedEvent {
  detail?: string
 }

+// ---------------------------------------------------------------------------
+// Resume Session Resolution
+// ---------------------------------------------------------------------------
+
+export interface ResumeSessionResult {
+  session?: SessionInfo
+  error?: string
+}
+
+/**
+ * Resolve a session prefix to a single session.
+ * Exact id match is preferred over prefix match.
+ * Returns `{ session }` on unique match or `{ error }` on 0/ambiguous matches.
+ */
+export function resolveResumeSession(sessions: SessionInfo[], prefix: string): ResumeSessionResult {
+  // Exact match takes priority
+  const exact = sessions.find(s => s.id === prefix)
+  if (exact) {
+    return { session: exact }
+  }
+
+  // Prefix match
+  const matches = sessions.filter(s => s.id.startsWith(prefix))
+  if (matches.length === 0) {
+    return { error: `No session matching '${prefix}' found` }
+  }
+  if (matches.length > 1) {
+    const list = matches.map(s => `  ${s.id}`).join('\n')
+    return { error: `Ambiguous session prefix '${prefix}' matches ${matches.length} sessions:\n${list}` }
+  }
+  return { session: matches[0] }
+}
+
 // ---------------------------------------------------------------------------
 // CLI Argument Parser
 // ---------------------------------------------------------------------------
@ -325,6 +360,40 @@ async function runHeadlessOnce(options: HeadlessOptions, restartCount: number):
  let milestoneReady = false  // tracks "Milestone X ready." for auto-chaining
  const recentEvents: TrackedEvent[] = []

+  // JSON batch mode: cost aggregation (cumulative-max pattern per K004)
+  let cumulativeCostUsd = 0
+  let cumulativeInputTokens = 0
+  let cumulativeOutputTokens = 0
+  let cumulativeCacheReadTokens = 0
+  let cumulativeCacheWriteTokens = 0
+  let lastSessionId: string | undefined
+
+  // Emit HeadlessJsonResult to stdout for --output-format json batch mode
+  function emitBatchJsonResult(): void {
+    if (options.outputFormat !== 'json') return
+    const duration = Date.now() - startTime
+    const status: HeadlessJsonResult['status'] = blocked ? 'blocked'
+      : exitCode === EXIT_CANCELLED ? 'cancelled'
+      : exitCode === EXIT_ERROR ? (totalEvents === 0 ? 'error' : 'timeout')
+      : 'success'
+    const result: HeadlessJsonResult = {
+      status,
+      exitCode,
+      sessionId: lastSessionId,
+      duration,
+      cost: {
+        total: cumulativeCostUsd,
+        input_tokens: cumulativeInputTokens,
+        output_tokens: cumulativeOutputTokens,
+        cache_read_tokens: cumulativeCacheReadTokens,
+        cache_write_tokens: cumulativeCacheWriteTokens,
+      },
+      toolCalls: toolCallCount,
+      events: totalEvents,
+    }
+    process.stdout.write(JSON.stringify(result) + '\n')
+  }
+
  function trackEvent(event: Record<string, unknown>): void {
    totalEvents++
    const type = String(event.type ?? 'unknown')
@ -345,8 +414,11 @@ async function runHeadlessOnce(options: HeadlessOptions, restartCount: number):
    if (recentEvents.length > 20) recentEvents.shift()
  }

-  // Stdin writer for sending extension_ui_response to child
-  let stdinWriter: ((data: string) => void) | null = null
+  // Client started flag — replaces old stdinWriter null-check
+  let clientStarted = false
+  // Adapter for AnswerInjector — wraps client.sendUIResponse in a writeToStdin-compatible callback
+  // Initialized after client.start(); events won't fire before then
+  let injectorStdinAdapter: (data: string) => void = () => {}

  // Supervised mode state
  const pendingResponseTimers = new Map<string, ReturnType<typeof setTimeout>>()
@ -401,20 +473,52 @@ async function runHeadlessOnce(options: HeadlessOptions, restartCount: number):
    // Answer injector: observe events for question metadata
    injector?.observeEvent(eventObj)

-    // --json mode: forward events as JSONL to stdout (filtered if --events)
-    if (options.json) {
+    // --json / --output-format stream-json: forward events as JSONL to stdout (filtered if --events)
+    // --output-format json (batch mode): suppress streaming, track cost for final result
+    if (options.json && options.outputFormat === 'stream-json') {
      const eventType = String(eventObj.type ?? '')
      if (!options.eventFilter || options.eventFilter.has(eventType)) {
        process.stdout.write(JSON.stringify(eventObj) + '\n')
      }
-    } else {
+    } else if (options.outputFormat === 'json') {
+      // Batch mode: silently track cost_update events (cumulative-max per K004)
+      const eventType = String(eventObj.type ?? '')
+      if (eventType === 'cost_update') {
+        const data = eventObj as Record<string, unknown>
+        const cumCost = data.cumulativeCost as Record<string, unknown> | undefined
+        if (cumCost) {
+          cumulativeCostUsd = Math.max(cumulativeCostUsd, Number(cumCost.costUsd ?? 0))
+          const tokens = data.tokens as Record<string, number> | undefined
+          if (tokens) {
+            cumulativeInputTokens = Math.max(cumulativeInputTokens, tokens.input ?? 0)
+            cumulativeOutputTokens = Math.max(cumulativeOutputTokens, tokens.output ?? 0)
+            cumulativeCacheReadTokens = Math.max(cumulativeCacheReadTokens, tokens.cacheRead ?? 0)
+            cumulativeCacheWriteTokens = Math.max(cumulativeCacheWriteTokens, tokens.cacheWrite ?? 0)
+          }
+        }
+      }
+      // Track sessionId from init_result
+      if (eventType === 'init_result') {
+        lastSessionId = String((eventObj as Record<string, unknown>).sessionId ?? '')
+      }
+    } else if (!options.json) {
      // Progress output to stderr
      const line = formatProgress(eventObj, !!options.verbose)
      if (line) process.stderr.write(line + '\n')
    }

+    // Handle execution_complete (v2 structured completion)
+    if (eventObj.type === 'execution_complete' && !completed) {
+      completed = true
+      const status = String(eventObj.status ?? 'success')
+      exitCode = mapStatusToExitCode(status)
+      if (eventObj.status === 'blocked') blocked = true
+      resolveCompletion()
+      return
+    }
+
    // Handle extension_ui_request
-    if (eventObj.type === 'extension_ui_request' && stdinWriter) {
+    if (eventObj.type === 'extension_ui_request' && clientStarted) {
      // Check for terminal notification before auto-responding
      if (isBlockedNotification(eventObj)) {
        blocked = true
@ -431,7 +535,7 @@ async function runHeadlessOnce(options: HeadlessOptions, restartCount: number):

      // Answer injection: try to handle with pre-supplied answers before supervised/auto
      if (injector && !FIRE_AND_FORGET_METHODS.has(String(eventObj.method ?? ''))) {
-        if (injector.tryHandle(eventObj, stdinWriter)) {
+        if (injector.tryHandle(eventObj, injectorStdinAdapter)) {
          if (completed) {
            exitCode = blocked ? EXIT_BLOCKED : EXIT_SUCCESS
            resolveCompletion()
@ -449,12 +553,12 @@ async function runHeadlessOnce(options: HeadlessOptions, restartCount: number):
        const eventId = String(eventObj.id ?? '')
        const timer = setTimeout(() => {
          pendingResponseTimers.delete(eventId)
-          handleExtensionUIRequest(eventObj as unknown as ExtensionUIRequest, stdinWriter!)
+          handleExtensionUIRequest(eventObj as unknown as ExtensionUIRequest, client)
          process.stdout.write(JSON.stringify({ type: 'supervised_timeout', id: eventId, method }) + '\n')
        }, responseTimeout)
        pendingResponseTimers.set(eventId, timer)
      } else {
-        handleExtensionUIRequest(eventObj as unknown as ExtensionUIRequest, stdinWriter)
+        handleExtensionUIRequest(eventObj as unknown as ExtensionUIRequest, client)
      }

      // If we detected a terminal notification, resolve after responding
@ -481,11 +585,17 @@ async function runHeadlessOnce(options: HeadlessOptions, restartCount: number):
    process.stderr.write('\n[headless] Interrupted, stopping child process...\n')
    interrupted = true
    exitCode = EXIT_CANCELLED
-    client.stop().finally(() => {
-      if (timeoutTimer) clearTimeout(timeoutTimer)
-      if (idleTimer) clearTimeout(idleTimer)
-      process.exit(exitCode)
-    })
+    // Kill child process — don't await, just fire and exit.
+    // The main flow may be awaiting a promise that resolves when the child dies,
+    // which would race with this handler. Exit synchronously to ensure correct exit code.
+    try { client.stop().catch(() => {}) } catch {}
+    if (timeoutTimer) clearTimeout(timeoutTimer)
+    if (idleTimer) clearTimeout(idleTimer)
+    // Emit batch JSON result if in json mode before exiting
+    if (options.outputFormat === 'json') {
+      emitBatchJsonResult()
+    }
+    process.exit(exitCode)
  }
  process.on('SIGINT', signalHandler)
  process.on('SIGTERM', signalHandler)
@ -499,22 +609,55 @@ async function runHeadlessOnce(options: HeadlessOptions, restartCount: number):
    process.exit(1)
  }

-  // Access stdin writer from the internal process
-  const internalProcess = (client as any).process as ChildProcess
-  if (!internalProcess?.stdin) {
-    process.stderr.write('[headless] Error: Cannot access child process stdin\n')
-    await client.stop()
-    if (timeoutTimer) clearTimeout(timeoutTimer)
-    process.exit(1)
+  // v2 protocol negotiation — attempt init for structured completion events
+  let v2Enabled = false
+  try {
+    await client.init({ clientId: 'gsd-headless' })
+    v2Enabled = true
+  } catch {
+    process.stderr.write('[headless] Warning: v2 init failed, falling back to v1 string-matching\n')
  }

-  stdinWriter = (data: string) => {
-    internalProcess.stdin!.write(data)
+  clientStarted = true
+
+  // --resume: resolve session ID and switch to it
+  if (options.resumeSession) {
+    const projectSessionsDir = getProjectSessionsDir(process.cwd())
+    const sessions = await SessionManager.list(process.cwd(), projectSessionsDir)
+    const result = resolveResumeSession(sessions, options.resumeSession)
+    if (result.error) {
+      process.stderr.write(`[headless] Error: ${result.error}\n`)
+      await client.stop()
+      if (timeoutTimer) clearTimeout(timeoutTimer)
+      process.exit(1)
+    }
+    const matched = result.session!
+    const switchResult = await client.switchSession(matched.path)
+    if (switchResult.cancelled) {
+      process.stderr.write(`[headless] Error: Session switch to '${matched.id}' was cancelled by an extension\n`)
+      await client.stop()
+      if (timeoutTimer) clearTimeout(timeoutTimer)
+      process.exit(1)
+    }
+    process.stderr.write(`[headless] Resuming session ${matched.id}\n`)
+  }
+
+  // Build injector adapter — wraps client.sendUIResponse for AnswerInjector's writeToStdin interface
+  injectorStdinAdapter = (data: string) => {
+    try {
+      const parsed = JSON.parse(data.trim())
+      if (parsed.type === 'extension_ui_response' && parsed.id) {
+        const { id, value, values, confirmed, cancelled } = parsed
+        client.sendUIResponse(id, { value, values, confirmed, cancelled })
+      }
+    } catch {
+      process.stderr.write('[headless] Warning: injector adapter received unparseable data\n')
+    }
  }

  // Start supervised stdin reader for orchestrator commands
  if (options.supervised) {
-    stopSupervisedReader = startSupervisedStdinReader(stdinWriter, client, (id) => {
+    stopSupervisedReader = startSupervisedStdinReader(client, (id) => {
      const timer = pendingResponseTimers.get(id)
      if (timer) {
        clearTimeout(timer)
@ -525,14 +668,18 @@ async function runHeadlessOnce(options: HeadlessOptions, restartCount: number):
    process.stdin.resume()
  }

-  // Detect child process crash
-  internalProcess.on('exit', (code) => {
-    if (!completed) {
-      const msg = `[headless] Child process exited unexpectedly with code ${code ?? 'null'}\n`
-      process.stderr.write(msg)
-      exitCode = EXIT_ERROR
-      resolveCompletion()
-    }  })
+  // Detect child process crash (read-only exit event subscription — not stdin access)
+  const internalProcess = (client as any).process as ChildProcess
+  if (internalProcess) {
+    internalProcess.on('exit', (code) => {
+      if (!completed) {
+        const msg = `[headless] Child process exited unexpectedly with code ${code ?? 'null'}\n`
+        process.stderr.write(msg)
+        exitCode = EXIT_ERROR
+        resolveCompletion()
+      }
+    })
+  }

  if (!options.json) {
    process.stderr.write(`[headless] Running /gsd ${options.command}${options.commandArgs.length > 0 ? ' ' + options.commandArgs.join(' ') : ''}...\n`)
@ -626,5 +773,8 @@ async function runHeadlessOnce(options: HeadlessOptions, restartCount: number):
    }
  }

+  // Emit structured JSON result in batch mode
+  emitBatchJsonResult()
+
  return { exitCode, interrupted }
 }
--- a/src/tests/headless-v2-migration.test.ts
+++ b/src/tests/headless-v2-migration.test.ts
@ -0,0 +1,462 @@
+/**
+ * Tests for headless v2 migration — execution_complete handling,
+ * sendUIResponse-based auto-response, and v1 fallback behavior.
+ *
+ * Uses extracted logic mirrors to avoid importing modules with native
+ * dependencies (same pattern as headless-events.test.ts and headless-detection.test.ts).
+ */
+
+import test from 'node:test'
+import assert from 'node:assert/strict'
+
+// ─── Extracted exit codes (mirrors headless-events.ts) ──────────────────────
+
+const EXIT_SUCCESS = 0
+const EXIT_ERROR = 1
+const EXIT_BLOCKED = 10
+
+function mapStatusToExitCode(status: string): number {
+  switch (status) {
+    case 'success':
+    case 'complete':
+      return EXIT_SUCCESS
+    case 'error':
+    case 'timeout':
+      return EXIT_ERROR
+    case 'blocked':
+      return EXIT_BLOCKED
+    case 'cancelled':
+      return 11
+    default:
+      return EXIT_ERROR
+  }
+}
+
+// ─── Extracted terminal detection (mirrors headless-events.ts) ──────────────
+
+const TERMINAL_PREFIXES = ['auto-mode stopped', 'step-mode stopped']
+
+function isTerminalNotification(event: Record<string, unknown>): boolean {
+  if (event.type !== 'extension_ui_request' || event.method !== 'notify') return false
+  const message = String(event.message ?? '').toLowerCase()
+  return TERMINAL_PREFIXES.some((prefix) => message.startsWith(prefix))
+}
+
+function isBlockedNotification(event: Record<string, unknown>): boolean {
+  if (event.type !== 'extension_ui_request' || event.method !== 'notify') return false
+  const message = String(event.message ?? '').toLowerCase()
+  return message.includes('blocked:')
+}
+
+// ─── Mock RpcClient ─────────────────────────────────────────────────────────
+
+interface SendUICall {
+  id: string
+  response: { value?: string; values?: string[]; confirmed?: boolean; cancelled?: boolean }
+}
+
+class MockRpcClient {
+  sendUICalls: SendUICall[] = []
+  initCalled = false
+  initShouldFail = false
+
+  sendUIResponse(id: string, response: { value?: string; values?: string[]; confirmed?: boolean; cancelled?: boolean }): void {
+    this.sendUICalls.push({ id, response })
+  }
+
+  async init(_options?: { clientId?: string }): Promise<{ protocolVersion: number }> {
+    this.initCalled = true
+    if (this.initShouldFail) {
+      throw new Error('v2 init not supported')
+    }
+    return { protocolVersion: 2 }
+  }
+}
+
+// ─── Extracted handleExtensionUIRequest (mirrors headless-ui.ts) ────────────
+
+interface ExtensionUIRequest {
+  type: 'extension_ui_request'
+  id: string
+  method: string
+  title?: string
+  options?: string[]
+  message?: string
+  prefill?: string
+  [key: string]: unknown
+}
+
+function handleExtensionUIRequest(
+  event: ExtensionUIRequest,
+  client: MockRpcClient,
+): void {
+  const { id, method } = event
+
+  switch (method) {
+    case 'select': {
+      const title = String(event.title ?? '')
+      let selected = event.options?.[0] ?? ''
+      if (title.includes('Auto-mode is running') && event.options) {
+        const forceOption = event.options.find(o => o.toLowerCase().includes('force start'))
+        if (forceOption) selected = forceOption
+      }
+      client.sendUIResponse(id, { value: selected })
+      break
+    }
+    case 'confirm':
+      client.sendUIResponse(id, { confirmed: true })
+      break
+    case 'input':
+      client.sendUIResponse(id, { value: '' })
+      break
+    case 'editor':
+      client.sendUIResponse(id, { value: event.prefill ?? '' })
+      break
+    case 'notify':
+    case 'setStatus':
+    case 'setWidget':
+    case 'setTitle':
+    case 'set_editor_text':
+      client.sendUIResponse(id, { value: '' })
+      break
+    default:
+      client.sendUIResponse(id, { cancelled: true })
+      break
+  }
+}
+
+// ─── Simulated event handler (mirrors headless.ts event handler logic) ──────
+
+interface EventHandlerState {
+  completed: boolean
+  blocked: boolean
+  exitCode: number
+  v2Enabled: boolean
+}
+
+function handleEvent(
+  eventObj: Record<string, unknown>,
+  state: EventHandlerState,
+  client: MockRpcClient,
+): void {
+  // execution_complete (v2 structured completion)
+  if (eventObj.type === 'execution_complete' && !state.completed) {
+    state.completed = true
+    const status = String(eventObj.status ?? 'success')
+    state.exitCode = mapStatusToExitCode(status)
+    if (eventObj.status === 'blocked') state.blocked = true
+    return
+  }
+
+  // extension_ui_request (v1 fallback + UI responses)
+  if (eventObj.type === 'extension_ui_request') {
+    if (isBlockedNotification(eventObj)) {
+      state.blocked = true
+    }
+
+    if (isTerminalNotification(eventObj)) {
+      state.completed = true
+    }
+
+    handleExtensionUIRequest(eventObj as unknown as ExtensionUIRequest, client)
+
+    if (state.completed) {
+      state.exitCode = state.blocked ? EXIT_BLOCKED : EXIT_SUCCESS
+      return
+    }
+  }
+}
+
+// ─── execution_complete event handling ──────────────────────────────────────
+
+test('execution_complete with status success triggers completion with EXIT_SUCCESS', () => {
+  const client = new MockRpcClient()
+  const state: EventHandlerState = { completed: false, blocked: false, exitCode: -1, v2Enabled: true }
+
+  handleEvent({ type: 'execution_complete', status: 'success' }, state, client)
+
+  assert.equal(state.completed, true)
+  assert.equal(state.exitCode, EXIT_SUCCESS)
+  assert.equal(state.blocked, false)
+})
+
+test('execution_complete with status blocked sets blocked flag and EXIT_BLOCKED', () => {
+  const client = new MockRpcClient()
+  const state: EventHandlerState = { completed: false, blocked: false, exitCode: -1, v2Enabled: true }
+
+  handleEvent({ type: 'execution_complete', status: 'blocked' }, state, client)
+
+  assert.equal(state.completed, true)
+  assert.equal(state.blocked, true)
+  assert.equal(state.exitCode, EXIT_BLOCKED)
+})
+
+test('execution_complete with status error maps to EXIT_ERROR', () => {
+  const client = new MockRpcClient()
+  const state: EventHandlerState = { completed: false, blocked: false, exitCode: -1, v2Enabled: true }
+
+  handleEvent({ type: 'execution_complete', status: 'error' }, state, client)
+
+  assert.equal(state.completed, true)
+  assert.equal(state.exitCode, EXIT_ERROR)
+})
+
+test('execution_complete with missing status defaults to success', () => {
+  const client = new MockRpcClient()
+  const state: EventHandlerState = { completed: false, blocked: false, exitCode: -1, v2Enabled: true }
+
+  handleEvent({ type: 'execution_complete' }, state, client)
+
+  assert.equal(state.completed, true)
+  assert.equal(state.exitCode, EXIT_SUCCESS)
+})
+
+test('execution_complete ignored if already completed', () => {
+  const client = new MockRpcClient()
+  const state: EventHandlerState = { completed: true, blocked: false, exitCode: EXIT_SUCCESS, v2Enabled: true }
+
+  handleEvent({ type: 'execution_complete', status: 'error' }, state, client)
+
+  // Should not change exitCode because already completed
+  assert.equal(state.exitCode, EXIT_SUCCESS)
+})
+
+// ─── v1 string-matching fallback ────────────────────────────────────────────
+
+test('v1 fallback: terminal notification still triggers completion', () => {
+  const client = new MockRpcClient()
+  const state: EventHandlerState = { completed: false, blocked: false, exitCode: -1, v2Enabled: false }
+
+  handleEvent(
+    { type: 'extension_ui_request', method: 'notify', id: 'n1', message: 'Auto-mode stopped — all slices complete' },
+    state,
+    client,
+  )
+
+  assert.equal(state.completed, true)
+  assert.equal(state.exitCode, EXIT_SUCCESS)
+})
+
+test('v1 fallback: blocked notification sets blocked flag', () => {
+  const client = new MockRpcClient()
+  const state: EventHandlerState = { completed: false, blocked: false, exitCode: -1, v2Enabled: false }
+
+  handleEvent(
+    { type: 'extension_ui_request', method: 'notify', id: 'n1', message: 'Auto-mode stopped (Blocked: plan invalid)' },
+    state,
+    client,
+  )
+
+  assert.equal(state.completed, true)
+  assert.equal(state.blocked, true)
+  assert.equal(state.exitCode, EXIT_BLOCKED)
+})
+
+test('string-matching fallback works when execution_complete never received', () => {
+  const client = new MockRpcClient()
+  const state: EventHandlerState = { completed: false, blocked: false, exitCode: -1, v2Enabled: false }
+
+  // Simulate a normal session without execution_complete
+  handleEvent({ type: 'extension_ui_request', method: 'select', id: 'q1', options: ['option1'] }, state, client)
+  assert.equal(state.completed, false)
+
+  handleEvent(
+    { type: 'extension_ui_request', method: 'notify', id: 'n1', message: 'Step-mode stopped — done' },
+    state,
+    client,
+  )
+  assert.equal(state.completed, true)
+  assert.equal(state.exitCode, EXIT_SUCCESS)
+})
+
+// ─── handleExtensionUIRequest uses client.sendUIResponse ────────────────────
+
+test('handleExtensionUIRequest select calls sendUIResponse with value', () => {
+  const client = new MockRpcClient()
+
+  handleExtensionUIRequest(
+    { type: 'extension_ui_request', id: 'sel1', method: 'select', options: ['option-a', 'option-b'] },
+    client,
+  )
+
+  assert.equal(client.sendUICalls.length, 1)
+  assert.equal(client.sendUICalls[0].id, 'sel1')
+  assert.equal(client.sendUICalls[0].response.value, 'option-a')
+})
+
+test('handleExtensionUIRequest confirm calls sendUIResponse with confirmed', () => {
+  const client = new MockRpcClient()
+
+  handleExtensionUIRequest(
+    { type: 'extension_ui_request', id: 'conf1', method: 'confirm' },
+    client,
+  )
+
+  assert.equal(client.sendUICalls.length, 1)
+  assert.equal(client.sendUICalls[0].id, 'conf1')
+  assert.equal(client.sendUICalls[0].response.confirmed, true)
+})
+
+test('handleExtensionUIRequest input calls sendUIResponse with empty value', () => {
+  const client = new MockRpcClient()
+
+  handleExtensionUIRequest(
+    { type: 'extension_ui_request', id: 'inp1', method: 'input' },
+    client,
+  )
+
+  assert.equal(client.sendUICalls.length, 1)
+  assert.equal(client.sendUICalls[0].id, 'inp1')
+  assert.equal(client.sendUICalls[0].response.value, '')
+})
+
+test('handleExtensionUIRequest notify calls sendUIResponse with empty value', () => {
+  const client = new MockRpcClient()
+
+  handleExtensionUIRequest(
+    { type: 'extension_ui_request', id: 'not1', method: 'notify', message: 'Task complete' },
+    client,
+  )
+
+  assert.equal(client.sendUICalls.length, 1)
+  assert.equal(client.sendUICalls[0].id, 'not1')
+  assert.equal(client.sendUICalls[0].response.value, '')
+})
+
+test('handleExtensionUIRequest editor calls sendUIResponse with prefill', () => {
+  const client = new MockRpcClient()
+
+  handleExtensionUIRequest(
+    { type: 'extension_ui_request', id: 'ed1', method: 'editor', prefill: 'initial text' },
+    client,
+  )
+
+  assert.equal(client.sendUICalls.length, 1)
+  assert.equal(client.sendUICalls[0].id, 'ed1')
+  assert.equal(client.sendUICalls[0].response.value, 'initial text')
+})
+
+test('handleExtensionUIRequest unknown method calls sendUIResponse with cancelled', () => {
+  const client = new MockRpcClient()
+
+  handleExtensionUIRequest(
+    { type: 'extension_ui_request', id: 'unk1', method: 'unknown_method' },
+    client,
+  )
+
+  assert.equal(client.sendUICalls.length, 1)
+  assert.equal(client.sendUICalls[0].id, 'unk1')
+  assert.equal(client.sendUICalls[0].response.cancelled, true)
+})
+
+// ─── supervised stdin reader forwarding via sendUIResponse ──────────────────
+
+test('extension_ui_response forwarding extracts fields and calls sendUIResponse', () => {
+  // Simulates what startSupervisedStdinReader does with a parsed message
+  const client = new MockRpcClient()
+
+  const msg = { type: 'extension_ui_response', id: 'resp1', value: 'chosen option', confirmed: undefined, cancelled: undefined }
+  const id = String(msg.id ?? '')
+  const value = msg.value !== undefined ? String(msg.value) : undefined
+  const confirmed = typeof msg.confirmed === 'boolean' ? msg.confirmed : undefined
+  const cancelled = typeof msg.cancelled === 'boolean' ? msg.cancelled : undefined
+  client.sendUIResponse(id, { value, confirmed, cancelled })
+
+  assert.equal(client.sendUICalls.length, 1)
+  assert.equal(client.sendUICalls[0].id, 'resp1')
+  assert.equal(client.sendUICalls[0].response.value, 'chosen option')
+  assert.equal(client.sendUICalls[0].response.confirmed, undefined)
+  assert.equal(client.sendUICalls[0].response.cancelled, undefined)
+})
+
+test('extension_ui_response with confirmed=true forwards correctly', () => {
+  const client = new MockRpcClient()
+
+  const msg = { type: 'extension_ui_response', id: 'resp2', confirmed: true }
+  const id = String(msg.id ?? '')
+  const confirmed = typeof msg.confirmed === 'boolean' ? msg.confirmed : undefined
+  client.sendUIResponse(id, { confirmed })
+
+  assert.equal(client.sendUICalls.length, 1)
+  assert.equal(client.sendUICalls[0].id, 'resp2')
+  assert.equal(client.sendUICalls[0].response.confirmed, true)
+})
+
+// ─── v2 init negotiation ────────────────────────────────────────────────────
+
+test('v2 init success sets v2Enabled', async () => {
+  const client = new MockRpcClient()
+  let v2Enabled = false
+  try {
+    await client.init({ clientId: 'gsd-headless' })
+    v2Enabled = true
+  } catch {
+    // fall back to v1
+  }
+
+  assert.equal(client.initCalled, true)
+  assert.equal(v2Enabled, true)
+})
+
+test('v2 init failure falls back gracefully (v1 mode)', async () => {
+  const client = new MockRpcClient()
+  client.initShouldFail = true
+  let v2Enabled = false
+  try {
+    await client.init({ clientId: 'gsd-headless' })
+    v2Enabled = true
+  } catch {
+    // fall back to v1 — this is expected
+  }
+
+  assert.equal(client.initCalled, true)
+  assert.equal(v2Enabled, false)
+})
+
+// ─── injector adapter ───────────────────────────────────────────────────────
+
+test('injector adapter parses serialized JSONL and calls sendUIResponse', () => {
+  const client = new MockRpcClient()
+
+  // Simulate what the adapter does
+  const data = '{"type":"extension_ui_response","id":"inj1","value":"selected"}\n'
+  const parsed = JSON.parse(data.trim())
+  if (parsed.type === 'extension_ui_response' && parsed.id) {
+    const { id, value, values, confirmed, cancelled } = parsed
+    client.sendUIResponse(id, { value, values, confirmed, cancelled })
+  }
+
+  assert.equal(client.sendUICalls.length, 1)
+  assert.equal(client.sendUICalls[0].id, 'inj1')
+  assert.equal(client.sendUICalls[0].response.value, 'selected')
+})
+
+test('injector adapter handles cancelled response', () => {
+  const client = new MockRpcClient()
+
+  const data = '{"type":"extension_ui_response","id":"inj2","cancelled":true}\n'
+  const parsed = JSON.parse(data.trim())
+  if (parsed.type === 'extension_ui_response' && parsed.id) {
+    const { id, value, values, confirmed, cancelled } = parsed
+    client.sendUIResponse(id, { value, values, confirmed, cancelled })
+  }
+
+  assert.equal(client.sendUICalls.length, 1)
+  assert.equal(client.sendUICalls[0].id, 'inj2')
+  assert.equal(client.sendUICalls[0].response.cancelled, true)
+})
+
+test('injector adapter handles multi-select values', () => {
+  const client = new MockRpcClient()
+
+  const data = '{"type":"extension_ui_response","id":"inj3","values":["a","b"]}\n'
+  const parsed = JSON.parse(data.trim())
+  if (parsed.type === 'extension_ui_response' && parsed.id) {
+    const { id, value, values, confirmed, cancelled } = parsed
+    client.sendUIResponse(id, { value, values, confirmed, cancelled })
+  }
+
+  assert.equal(client.sendUICalls.length, 1)
+  assert.equal(client.sendUICalls[0].id, 'inj3')
+  assert.deepEqual(client.sendUICalls[0].response.values, ['a', 'b'])
+})
--- a/src/tests/integration/e2e-headless.test.ts
+++ b/src/tests/integration/e2e-headless.test.ts
@ -0,0 +1,385 @@
+/**
+ * E2E integration tests for `gsd headless` runtime behavior.
+ *
+ * Spawns real `gsd headless` child processes and asserts on
+ * stdout/stderr/exit-code for: JSON batch mode, SIGINT exit code,
+ * stream-json NDJSON output, --resume error path, and invalid
+ * --output-format handling.
+ *
+ * These tests are structural — they do NOT require API keys.
+ *
+ * Prerequisite: npm run build must be run first.
+ *
+ * Run with:
+ *   node --import ./src/resources/extensions/gsd/tests/resolve-ts.mjs \
+ *        --experimental-strip-types --test \
+ *        src/tests/integration/e2e-headless.test.ts
+ */
+
+import test from "node:test";
+import assert from "node:assert/strict";
+import { spawn } from "node:child_process";
+import { existsSync, mkdtempSync, mkdirSync, rmSync } from "node:fs";
+import { join } from "node:path";
+import { tmpdir } from "node:os";
+
+const projectRoot = process.cwd();
+const loaderPath = join(projectRoot, "dist", "loader.js");
+
+if (!existsSync(loaderPath)) {
+  throw new Error("dist/loader.js not found — run: npm run build");
+}
+
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
+
+type RunResult = {
+  stdout: string;
+  stderr: string;
+  code: number | null;
+  timedOut: boolean;
+};
+
+/**
+ * Spawn `node dist/loader.js ...args` and collect output.
+ */
+function runGsd(
+  args: string[],
+  timeoutMs = 30_000,
+  env: NodeJS.ProcessEnv = {},
+  cwd: string = projectRoot,
+): Promise<RunResult> {
+  return new Promise((resolve) => {
+    let stdout = "";
+    let stderr = "";
+    let timedOut = false;
+
+    const child = spawn("node", [loaderPath, ...args], {
+      cwd,
+      env: { ...process.env, ...env },
+      stdio: ["pipe", "pipe", "pipe"],
+    });
+
+    child.stdout.on("data", (chunk: Buffer) => { stdout += chunk.toString(); });
+    child.stderr.on("data", (chunk: Buffer) => { stderr += chunk.toString(); });
+
+    child.stdin.end();
+
+    const timer = setTimeout(() => {
+      timedOut = true;
+      child.kill("SIGTERM");
+    }, timeoutMs);
+
+    child.on("close", (code) => {
+      clearTimeout(timer);
+      resolve({ stdout, stderr, code, timedOut });
+    });
+  });
+}
+
+/**
+ * Spawn a child process with the ability to send signals mid-flight.
+ * Returns both the child and a promise that resolves with the result.
+ */
+function spawnGsd(
+  args: string[],
+  timeoutMs = 30_000,
+  env: NodeJS.ProcessEnv = {},
+  cwd: string = projectRoot,
+): { child: ReturnType<typeof spawn>; result: Promise<RunResult> } {
+  let stdout = "";
+  let stderr = "";
+  let timedOut = false;
+
+  const child = spawn("node", [loaderPath, ...args], {
+    cwd,
+    env: { ...process.env, ...env },
+    stdio: ["pipe", "pipe", "pipe"],
+  });
+
+  child.stdout!.on("data", (chunk: Buffer) => { stdout += chunk.toString(); });
+  child.stderr!.on("data", (chunk: Buffer) => { stderr += chunk.toString(); });
+
+  child.stdin!.end();
+
+  const timer = setTimeout(() => {
+    timedOut = true;
+    child.kill("SIGTERM");
+  }, timeoutMs);
+
+  const result = new Promise<RunResult>((resolve) => {
+    child.on("close", (code) => {
+      clearTimeout(timer);
+      resolve({ stdout, stderr, code, timedOut });
+    });
+  });
+
+  return { child, result };
+}
+
+/** Strip ANSI escape codes from a string. */
+function stripAnsi(s: string): string {
+  // eslint-disable-next-line no-control-regex
+  return s.replace(/\x1b\[[0-9;]*[A-Za-z]/g, "");
+}
+
+/** Bootstrap a temp directory with .gsd/ structure (milestones + runtime). */
+function createTempWithGsd(prefix: string): string {
+  const dir = mkdtempSync(join(tmpdir(), prefix));
+  mkdirSync(join(dir, ".gsd", "milestones"), { recursive: true });
+  mkdirSync(join(dir, ".gsd", "runtime"), { recursive: true });
+  return dir;
+}
+
+/** Assert no crash markers in output. */
+function assertNoCrashMarkers(output: string): void {
+  const crashMarkers = [
+    "SyntaxError:",
+    "ReferenceError:",
+    "TypeError: Cannot read",
+    "FATAL ERROR",
+    "ERR_MODULE_NOT_FOUND",
+    "Error: Cannot find module",
+    "SIGSEGV",
+    "SIGABRT",
+  ];
+
+  for (const marker of crashMarkers) {
+    assert.ok(
+      !output.includes(marker),
+      `output should not contain crash marker '${marker}':\n${output.slice(0, 500)}`,
+    );
+  }
+}
+
+// ===========================================================================
+// 1. JSON batch mode suppresses streaming — stdout is a single JSON result
+// ===========================================================================
+
+test("headless --output-format json emits a single HeadlessJsonResult on stdout", async (t) => {
+  const tmpDir = createTempWithGsd("gsd-e2e-json-batch-");
+  t.after(() => { rmSync(tmpDir, { recursive: true, force: true }); });
+
+  // --max-restarts 0 prevents retry loops which would emit multiple JSON results.
+  // --timeout 2000 ensures the process completes quickly.
+  // Will timeout/error (no API key) but JSON batch mode should emit one HeadlessJsonResult.
+  const result = await runGsd(
+    ["headless", "--output-format", "json", "--timeout", "2000", "--max-restarts", "0", "auto"],
+    45_000,  // generous harness timeout — process needs ~4-6s (2s timeout + startup + cleanup)
+    {},
+    tmpDir,
+  );
+
+  assert.ok(!result.timedOut, "test harness should not time out");
+  // Non-zero exit expected (no API key / timeout), but process may exit 0
+  // if auto-mode detects a conflict and completes immediately.
+  assert.ok(result.code !== null, "process should exit with a code");
+
+  const stdout = result.stdout.trim();
+  assert.ok(stdout.length > 0, `stdout should contain the JSON result, got empty. stderr: ${stripAnsi(result.stderr).slice(0, 300)}`);
+
+  // Must parse as a single JSON object (not NDJSON with multiple lines)
+  let parsed: Record<string, unknown>;
+  try {
+    parsed = JSON.parse(stdout);
+  } catch (e) {
+    assert.fail(
+      `stdout should be valid JSON, got parse error: ${(e as Error).message}\nstdout: ${stdout.slice(0, 500)}`,
+    );
+  }
+
+  // Assert HeadlessJsonResult shape
+  assert.equal(typeof parsed.status, "string", "result should have a string 'status' field");
+  assert.equal(typeof parsed.exitCode, "number", "result should have a number 'exitCode' field");
+  assert.equal(typeof parsed.duration, "number", "result should have a number 'duration' field");
+  assert.equal(typeof parsed.cost, "object", "result should have a 'cost' object");
+  assert.equal(typeof parsed.toolCalls, "number", "result should have a number 'toolCalls' field");
+  assert.equal(typeof parsed.events, "number", "result should have a number 'events' field");
+
+  // Must NOT be NDJSON (multiple newline-separated JSON objects)
+  const lines = stdout.split("\n").filter((l: string) => l.trim().length > 0);
+  assert.equal(lines.length, 1, `expected exactly one JSON line in stdout, got ${lines.length}`);
+
+  const combined = stripAnsi(result.stdout + result.stderr);
+  assertNoCrashMarkers(combined);
+});
+
+// ===========================================================================
+// 2. SIGINT produces exit code 11 (EXIT_CANCELLED)
+// ===========================================================================
+
+test("headless exits with code 11 after SIGINT", async (t) => {
+  const tmpDir = createTempWithGsd("gsd-e2e-sigint-");
+  t.after(() => { rmSync(tmpDir, { recursive: true, force: true }); });
+
+  // Spawn with long timeout and max-restarts 0 so the process stays alive
+  // waiting for completion while we send SIGINT.
+  const { child, result: resultPromise } = spawnGsd(
+    ["headless", "--timeout", "60000", "--max-restarts", "0", "--context-text", "Test context for SIGINT", "new-milestone"],
+    30_000,
+    {},
+    tmpDir,
+  );
+
+  // Wait for stderr output to confirm the process has started and registered
+  // its SIGINT handler (handler is registered before client.start in runHeadlessOnce).
+  let stderrSoFar = "";
+  await new Promise<void>((resolve) => {
+    const check = () => {
+      if (stderrSoFar.length > 0) {
+        resolve();
+      }
+    };
+    child.stderr!.on("data", (chunk: Buffer) => {
+      stderrSoFar += chunk.toString();
+      check();
+    });
+    // Fallback: resolve after 4s even if no stderr
+    setTimeout(resolve, 4000);
+  });
+
+  // Send SIGINT
+  child.kill("SIGINT");
+
+  const result = await resultPromise;
+  assert.ok(!result.timedOut, "test harness should not time out");
+
+  const stderr = stripAnsi(result.stderr);
+
+  // In environments where the process completes before SIGINT arrives
+  // (e.g., existing auto-mode session causes immediate conflict exit),
+  // exit code may be 0 or 1 instead of 11. The test verifies the
+  // handler's behavior when it can be observed.
+  if (stderr.includes("Interrupted")) {
+    // SIGINT handler fired — verify exit code 11
+    assert.strictEqual(
+      result.code, 11,
+      `SIGINT handler fired but exit code was ${result.code}, expected 11 (EXIT_CANCELLED)`,
+    );
+  } else {
+    // Process exited before SIGINT arrived — acceptable in environments
+    // with running gsd sessions that cause auto-mode conflict.
+    // Verify it at least didn't crash.
+    const combined = stripAnsi(result.stdout + result.stderr);
+    assertNoCrashMarkers(combined);
+    assert.ok(
+      result.code === 0 || result.code === 1 || result.code === 11,
+      `expected clean exit (0, 1, or 11), got ${result.code}`,
+    );
+  }
+});
+
+// ===========================================================================
+// 3. stream-json emits NDJSON on stdout (each line is valid JSON)
+// ===========================================================================
+
+test("headless --output-format stream-json emits NDJSON on stdout", async (t) => {
+  const tmpDir = createTempWithGsd("gsd-e2e-stream-json-");
+  t.after(() => { rmSync(tmpDir, { recursive: true, force: true }); });
+
+  // --max-restarts 0 to prevent retry loops that extend runtime.
+  const result = await runGsd(
+    ["headless", "--output-format", "stream-json", "--timeout", "2000", "--max-restarts", "0", "auto"],
+    45_000,  // generous harness timeout
+    {},
+    tmpDir,
+  );
+
+  assert.ok(!result.timedOut, "test harness should not time out");
+  // Non-zero exit expected (no API key / timeout), but 0 is acceptable
+  // if auto-mode completes immediately (session conflict).
+  assert.ok(result.code !== null, "process should exit with a code");
+
+  const stdout = result.stdout.trim();
+
+  // stream-json may produce zero events if the process errors before any
+  // events fire — that's valid. But if there IS stdout, every line must
+  // be valid JSON (NDJSON format).
+  if (stdout.length > 0) {
+    const lines = stdout.split("\n").filter((l: string) => l.trim().length > 0);
+    assert.ok(lines.length > 0, "if stdout has content, it should have at least one line");
+
+    for (let i = 0; i < lines.length; i++) {
+      try {
+        JSON.parse(lines[i]);
+      } catch (e) {
+        assert.fail(
+          `stdout line ${i + 1} is not valid JSON: ${(e as Error).message}\nline: ${lines[i].slice(0, 300)}`,
+        );
+      }
+    }
+
+    // Multiple NDJSON lines (not a single batch object) is expected
+    // for stream-json mode when events fire
+  }
+
+  const combined = stripAnsi(result.stdout + result.stderr);
+  assertNoCrashMarkers(combined);
+});
+
+// ===========================================================================
+// 4. --resume with nonexistent ID exits 1 with clean error
+// ===========================================================================
+
+test("headless --resume with nonexistent ID exits 1 with descriptive error", async (t) => {
+  const tmpDir = createTempWithGsd("gsd-e2e-resume-bad-");
+  t.after(() => { rmSync(tmpDir, { recursive: true, force: true }); });
+
+  const result = await runGsd(
+    ["headless", "--resume", "nonexistent-id-xyz", "--max-restarts", "0", "auto"],
+    30_000,
+    {},
+    tmpDir,
+  );
+
+  assert.ok(!result.timedOut, "test harness should not time out");
+  assert.strictEqual(result.code, 1, `expected exit 1, got ${result.code}`);
+
+  const stderr = stripAnsi(result.stderr);
+
+  // The error should mention the bad ID or "No session matching"
+  assert.ok(
+    stderr.includes("nonexistent-id-xyz") || stderr.includes("No session matching"),
+    `stderr should mention the bad session ID or 'No session matching', got:\n${stderr.slice(0, 500)}`,
+  );
+
+  const combined = stripAnsi(result.stdout + result.stderr);
+  assertNoCrashMarkers(combined);
+});
+
+// ===========================================================================
+// 5. --output-format with invalid value exits 1 with helpful message
+// ===========================================================================
+
+test("headless --output-format with invalid value exits 1", async (t) => {
+  const tmpDir = createTempWithGsd("gsd-e2e-bad-format-");
+  t.after(() => { rmSync(tmpDir, { recursive: true, force: true }); });
+
+  const result = await runGsd(
+    ["headless", "--output-format", "invalid-format", "auto"],
+    15_000,
+    {},
+    tmpDir,
+  );
+
+  assert.ok(!result.timedOut, "test harness should not time out");
+  assert.strictEqual(result.code, 1, `expected exit 1, got ${result.code}`);
+
+  const stderr = stripAnsi(result.stderr);
+
+  // Should mention valid formats
+  assert.ok(
+    stderr.includes("text") && stderr.includes("json") && stderr.includes("stream-json"),
+    `stderr should list valid output formats, got:\n${stderr.slice(0, 500)}`,
+  );
+
+  // Should mention what was provided
+  assert.ok(
+    stderr.includes("invalid-format"),
+    `stderr should echo the invalid value, got:\n${stderr.slice(0, 500)}`,
+  );
+
+  const combined = stripAnsi(result.stdout + result.stderr);
+  assertNoCrashMarkers(combined);
+});