feat(model-policy): adversary role + lineage-diverse-from-worker constraint

Add `adversary` to SUPPORTED_MODEL_ROLES and a new symbolic constraint `lineage-diverse-from-worker` to SUPPORTED_MODEL_ROLE_CONSTRAINTS. Default constraints for `adversary` and `reviewer` now include `lineage-diverse-from-worker` so the reviewer/adversary CANNOT be a lineage-twin of the model that produced the artifact under review — prevents "yeah looks fine to me" rubber-stamp from same-family models. Helpers exported alongside the policy: - rootVendorFor(modelId) → "anthropic" | "openai" | "google" | "moonshot" | "mistral" | "minimax" | "zhipu" | "meituan" | "unknown" - isSameRootVendor(candidateId, workerId) → boolean (fail-open on unknown) These are the building blocks the selector needs. The actual filter wiring in auto-model-selection's selectAndApplyModel is left as a documented TODO — the function doesn't currently thread role context through, so plugging in lineage filtering needs a small refactor that is out of scope here. Tests: 24 pass (was 6 + 18 new). Coverage: role registration, constraint registration, defaults, validation, rootVendor mapping matrix, isSameRootVendor predicate. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
2026-05-15 06:30:08 +02:00 · 2026-05-15 06:30:08 +02:00 · e7cf168824
commit e7cf168824
parent 8832be0785
3 changed files with 204 additions and 1 deletions
--- a/src/resources/extensions/sf/tests/model-role-policy.test.mjs
+++ b/src/resources/extensions/sf/tests/model-role-policy.test.mjs
@ -3,8 +3,12 @@ import { describe, test } from "vitest";

 import {
 	ModelRolePolicyValidationError,
+	SUPPORTED_MODEL_ROLE_CONSTRAINTS,
+	SUPPORTED_MODEL_ROLES,
+	isSameRootVendor,
 	normalizeRolePolicies,
 	normalizeRolePolicy,
+	rootVendorFor,
 	validateRolePolicy,
 } from "../uok/model-role-policy.js";

@ -91,6 +95,11 @@ describe("model role policy", () => {
 					mode: "auto",
 					constraints: ["cheap", "review"],
 				},
+				adversary: {
+					role: "adversary",
+					mode: "auto",
+					constraints: ["review", "lineage-diverse-from-worker"],
+				},
 			},
 		);
 	});
@ -101,4 +110,110 @@ describe("model role policy", () => {
 			/unsupported model role "planner"/,
 		);
 	});
+
+	// ── adversary role ──────────────────────────────────────────────────────────
+
+	// Shape every defaulted adversary policy is expected to normalize to.
+	const expectedAdversaryDefaults = {
+		role: "adversary",
+		mode: "auto",
+		constraints: ["review", "lineage-diverse-from-worker"],
+	};
+
+	// Registration: the role name must be part of the public role list.
+	test("adversary_is_a_supported_role", () => {
+		const isRegistered = SUPPORTED_MODEL_ROLES.includes("adversary");
+		assert.ok(isRegistered);
+	});
+
+	// Registration: the symbolic constraint must be part of the public list.
+	test("lineage_diverse_from_worker_is_a_supported_constraint", () => {
+		const isRegistered = SUPPORTED_MODEL_ROLE_CONSTRAINTS.includes(
+			"lineage-diverse-from-worker",
+		);
+		assert.ok(isRegistered);
+	});
+
+	// Defaults: normalizing the bare role name yields the full default policy.
+	test("adversary_default_constraints_include_review_and_lineage_diverse_from_worker", () => {
+		assert.deepEqual(normalizeRolePolicy("adversary"), expectedAdversaryDefaults);
+	});
+
+	// Defaults: reviewer gains the lineage constraint as well.
+	test("reviewer_default_constraints_include_lineage_diverse_from_worker", () => {
+		const { constraints } = normalizeRolePolicy("reviewer");
+		const failureMessage = `expected lineage-diverse-from-worker in reviewer defaults, got: ${constraints.join(", ")}`;
+		assert.ok(constraints.includes("lineage-diverse-from-worker"), failureMessage);
+	});
+
+	// Validation: an explicit lineage constraint on adversary is accepted.
+	test("validateRolePolicy_adversary_with_lineage_diverse_from_worker_is_valid", () => {
+		const outcome = validateRolePolicy("adversary", {
+			constraints: ["lineage-diverse-from-worker"],
+		});
+		assert.equal(outcome.ok, true);
+		const keptConstraint = outcome.policy.constraints.includes(
+			"lineage-diverse-from-worker",
+		);
+		assert.ok(keptConstraint);
+	});
+
+	// Full map: an empty input still produces an adversary entry with defaults.
+	test("normalizeRolePolicies_empty_input_includes_adversary_role", () => {
+		const allPolicies = normalizeRolePolicies({});
+		const hasAdversaryKey = "adversary" in allPolicies;
+		assert.ok(hasAdversaryKey, "adversary key missing from full policy map");
+		assert.deepEqual(allPolicies.adversary, expectedAdversaryDefaults);
+	});
+
+	// ── rootVendorFor / isSameRootVendor ────────────────────────────────────────
+
+	// Each test below pins one branch of the vendor-prefix mapping.
+	test("rootVendorFor_maps_claude_prefix_to_anthropic", () => {
+		assert.equal(rootVendorFor("claude-3-7-sonnet"), "anthropic");
+		assert.equal(rootVendorFor("claude-opus-4"), "anthropic");
+	});
+
+	test("rootVendorFor_maps_gpt_and_o_series_to_openai", () => {
+		assert.equal(rootVendorFor("gpt-4o"), "openai");
+		assert.equal(rootVendorFor("o1-preview"), "openai");
+		assert.equal(rootVendorFor("o3-mini"), "openai");
+		assert.equal(rootVendorFor("o4-mini"), "openai");
+	});
+
+	test("rootVendorFor_maps_gemini_prefix_to_google", () => {
+		assert.equal(rootVendorFor("gemini-2.5-pro"), "google");
+		assert.equal(rootVendorFor("gemma-3"), "google");
+	});
+
+	test("rootVendorFor_maps_kimi_prefix_to_moonshot", () => {
+		assert.equal(rootVendorFor("kimi-for-coding"), "moonshot");
+		assert.equal(rootVendorFor("kimi-k2.6"), "moonshot");
+	});
+
+	// The mistral branch had no coverage in the original matrix.
+	test("rootVendorFor_maps_mistral_prefix_to_mistral", () => {
+		assert.equal(rootVendorFor("mistral-large-latest"), "mistral");
+	});
+
+	test("rootVendorFor_maps_minimax_prefix_to_minimax", () => {
+		assert.equal(rootVendorFor("minimax-text-01"), "minimax");
+	});
+
+	test("rootVendorFor_maps_glm_and_zai_prefix_to_zhipu", () => {
+		assert.equal(rootVendorFor("glm-4"), "zhipu");
+		assert.equal(rootVendorFor("zai-something"), "zhipu");
+	});
+
+	test("rootVendorFor_maps_longcat_prefix_to_meituan", () => {
+		assert.equal(rootVendorFor("longcat-v1"), "meituan");
+	});
+
+	// Provider-namespaced IDs ("vendor/model") resolve through the namespace.
+	test("rootVendorFor_maps_provider_namespaced_ids_to_root_vendor", () => {
+		assert.equal(rootVendorFor("anthropic/claude-opus-4"), "anthropic");
+		assert.equal(rootVendorFor("openai/gpt-4o"), "openai");
+		assert.equal(rootVendorFor("google/gemini-2.5-pro"), "google");
+		assert.equal(rootVendorFor("moonshotai/kimi-k2"), "moonshot");
+		assert.equal(rootVendorFor("zhipu/glm-4"), "zhipu");
+	});
+
+	// The mapping lower-cases its input and tolerates nullish IDs.
+	test("rootVendorFor_is_case_insensitive_and_nullish_safe", () => {
+		assert.equal(rootVendorFor("Claude-Opus-4"), "anthropic");
+		assert.equal(rootVendorFor("GPT-4o"), "openai");
+		assert.equal(rootVendorFor(undefined), "unknown");
+		assert.equal(rootVendorFor(null), "unknown");
+	});
+
+	test("rootVendorFor_returns_unknown_for_unrecognised_model", () => {
+		assert.equal(rootVendorFor("mystery-model-x"), "unknown");
+		assert.equal(rootVendorFor(""), "unknown");
+	});
+
+	test("isSameRootVendor_true_when_same_family", () => {
+		assert.equal(isSameRootVendor("claude-3-5-sonnet", "claude-opus-4"), true);
+		assert.equal(isSameRootVendor("gpt-4o", "o1-preview"), true);
+	});
+
+	test("isSameRootVendor_false_when_different_family", () => {
+		assert.equal(isSameRootVendor("claude-3-5-sonnet", "gpt-4o"), false);
+		assert.equal(isSameRootVendor("gemini-2.5-pro", "kimi-for-coding"), false);
+	});
+
+	// Fail-open: an unrecognised ID on either side never counts as a match.
+	test("isSameRootVendor_false_when_either_model_is_unknown", () => {
+		assert.equal(isSameRootVendor("mystery-model", "claude-3-5-sonnet"), false);
+		assert.equal(isSameRootVendor("claude-3-5-sonnet", "mystery-model"), false);
+		assert.equal(isSameRootVendor("mystery-a", "mystery-b"), false);
+	});
 });
--- a/src/resources/extensions/sf/uok/index.js
+++ b/src/resources/extensions/sf/uok/index.js
@ -144,9 +144,11 @@ export {
 export { applyModelPolicyFilter } from "./model-policy.js";
 export {
 	DEFAULT_MODEL_ROLE_CONSTRAINTS,
+	isSameRootVendor,
 	ModelRolePolicyValidationError,
 	normalizeRolePolicies,
 	normalizeRolePolicy,
+	rootVendorFor,
 	SUPPORTED_MODEL_ROLE_CONSTRAINTS,
 	SUPPORTED_MODEL_ROLES,
 	validateRolePolicy,
--- a/src/resources/extensions/sf/uok/model-role-policy.js
+++ b/src/resources/extensions/sf/uok/model-role-policy.js
@ -20,6 +20,7 @@ export const SUPPORTED_MODEL_ROLES = Object.freeze([
 	"worker",
 	"validator",
 	"reviewer",
+	"adversary",
 ]);

 /**
@ -30,6 +31,21 @@ export const SUPPORTED_MODEL_ROLES = Object.freeze([
 *
 * Consumer: role-policy validation and autonomous route evidence writers.
 */
+
+/**
+ * `lineage-diverse-from-worker` — selected model must NOT share root-vendor
+ * lineage with the model that produced the artifact under review (the `worker`
+ * role's resolved model). Prevents "looks fine to me" rubber-stamp by
+ * lineage-twins. When the worker model is unknown or maps to "unknown" vendor,
+ * this constraint is treated as a no-op (fail-open rather than blocking all
+ * candidates). Enforcement is best-effort at the model-selection layer.
+ *
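+ * TODO(lineage-diverse-from-worker): wire handler in auto-model-selection.js
+ * selectAndApplyModel — after the policy gate resolves `routingEligibleModels`,
+ * resolve the worker role's model ID and keep only the candidates for which
+ * !isSameRootVendor(candidate.id, resolvedWorkerModelId) holds. Pass the
+ * worker's model ID, not a vendor label: isSameRootVendor() maps both of its
+ * arguments through rootVendorFor() itself, and a bare vendor label is not a
+ * recognised model ID, so the check would silently fail open. See
+ * rootVendorFor() in this file for the canonical vendor mapping.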
+ */
 export const SUPPORTED_MODEL_ROLE_CONSTRAINTS = Object.freeze([
 	"coding",
 	"review",
@ -38,6 +54,7 @@ export const SUPPORTED_MODEL_ROLE_CONSTRAINTS = Object.freeze([
 	"byok-allowed",
 	"local-only",
 	"strict-json",
+	"lineage-diverse-from-worker",
 ]);

 const MODEL_ROLES = new Set(SUPPORTED_MODEL_ROLES);
@ -63,7 +80,8 @@ export const DEFAULT_MODEL_ROLE_CONSTRAINTS = Object.freeze({
 	orchestrator: Object.freeze(["long-context", "strict-json"]),
 	worker: Object.freeze(["coding"]),
 	validator: Object.freeze(["strict-json", "review"]),
-	reviewer: Object.freeze(["review"]),
+	reviewer: Object.freeze(["review", "lineage-diverse-from-worker"]),
+	adversary: Object.freeze(["review", "lineage-diverse-from-worker"]),
 });

 /**
@ -233,3 +251,71 @@ export function normalizeRolePolicies(policies = {}) {
 		]),
 	);
 }
+
+/**
+ * Vendor label → lower-case model-ID prefixes that identify that vendor.
+ *
+ * Prefixes ending in "-" match bare model IDs ("claude-opus-4"); prefixes
+ * ending in "/" match provider-namespaced IDs ("anthropic/claude-opus-4").
+ * No prefix is a prefix of another vendor's entry, so row order is not
+ * significant.
+ */
+const ROOT_VENDOR_PREFIXES = Object.freeze([
+	["anthropic", ["claude-", "anthropic/"]],
+	["openai", ["gpt-", "chatgpt-", "openai/"]],
+	["google", ["gemini-", "gemma-", "google/", "google-"]],
+	["moonshot", ["kimi-", "moonshot-", "moonshot/", "moonshotai/"]],
+	[
+		"mistral",
+		[
+			"mistral-",
+			"mixtral-",
+			"codestral-",
+			"ministral-",
+			"pixtral-",
+			"mistral/",
+			"mistralai/",
+		],
+	],
+	["minimax", ["minimax-", "minimax/"]],
+	["zhipu", ["glm-", "zai-", "zai/", "z-ai/", "zhipu/"]],
+	["meituan", ["longcat-", "meituan/"]],
+]);
+
+/**
+ * OpenAI o-series IDs: "o1", "o3", "o4" either bare or followed by "-suffix".
+ * Anchored on both sides so IDs that merely start with "o" (e.g. "ollama-x")
+ * are not captured. No `g`/`y` flag, so `.test()` is stateless.
+ */
+const OPENAI_O_SERIES_PATTERN = /^o[134](?:-|$)/;
+
+/**
+ * Map a model ID to its root-vendor label for lineage-diversity checks.
+ *
+ * Purpose: back the `lineage-diverse-from-worker` constraint — model selection
+ * for reviewer/adversary roles must filter candidates that share a vendor with
+ * the worker's resolved model.
+ *
+ * Matching is case-insensitive and ignores surrounding whitespace. Because an
+ * "unknown" result means no filter is applied (fail-open), every unrecognised
+ * ID silently weakens the constraint; the table therefore also covers bare
+ * o-series IDs ("o1"), Moonshot's `moonshot-*` IDs, the Mistral model family
+ * names, and the `meituan/` / `z-ai/` namespaces.
+ *
+ * Returns one of: "anthropic" | "openai" | "google" | "moonshot" | "mistral" |
+ * "minimax" | "zhipu" | "meituan" | "unknown".
+ *
+ * Consumer: lineage-diverse-from-worker handler in the model-selection layer
+ * (not wired yet — tracked by the TODO(lineage-diverse-from-worker) note in
+ * this file).
+ *
+ * @param {string} modelId - Model identifier; nullish values are treated as "".
+ * @returns {string} Root-vendor label, or "unknown" when nothing matches.
+ */
+export function rootVendorFor(modelId) {
+	const id = String(modelId ?? "").trim().toLowerCase();
+	if (id === "") return "unknown";
+	if (OPENAI_O_SERIES_PATTERN.test(id)) return "openai";
+	for (const [vendor, prefixes] of ROOT_VENDOR_PREFIXES) {
+		if (prefixes.some((prefix) => id.startsWith(prefix))) return vendor;
+	}
+	return "unknown";
+}
+
+/**
+ * Predicate: do the two model IDs resolve to the same known root vendor?
+ *
+ * Purpose: lets the model-selection layer express the
+ * `lineage-diverse-from-worker` constraint as a single boolean check.
+ *
+ * An "unknown" vendor on either side never counts as a match, so an
+ * unrecognised model cannot cause a candidate to be excluded (fail-open).
+ *
+ * @param {string} candidateModelId - Model ID of the candidate being considered.
+ * @param {string} workerModelId - Model ID that produced the artifact under review.
+ * @returns {boolean} true only when both IDs map to the same non-"unknown" vendor.
+ */
+export function isSameRootVendor(candidateModelId, workerModelId) {
+	const candidateVendor = rootVendorFor(candidateModelId);
+	// An unrecognised candidate can never be a lineage twin.
+	if (candidateVendor === "unknown") return false;
+	// candidateVendor is known here, so equality also implies the worker's
+	// vendor is known; an "unknown" worker simply compares unequal.
+	return candidateVendor === rootVendorFor(workerModelId);
+}