diff --git a/packages/interfacectl-cli/dist/commands/generation-session.d.ts b/packages/interfacectl-cli/dist/commands/generation-session.d.ts
index 7d0149d..78911c5 100644
--- a/packages/interfacectl-cli/dist/commands/generation-session.d.ts
+++ b/packages/interfacectl-cli/dist/commands/generation-session.d.ts
@@ -54,7 +54,20 @@ export interface SummarizeGenerationBenchmarkCommandOptions {
     comparisonPaths?: string;
     suggestionPaths?: string;
     outDir?: string;
+    runPath?: string;
 }
+export interface ReplayGenerationBenchmarkCommandOptions {
+    specPath?: string;
+    tool?: string;
+    outDir?: string;
+    cohortId?: string;
+    sourceRunPath?: string;
+    requestedModelLabel?: string;
+    resolvedModelId?: string;
+    baseUrl?: string;
+    fingerprint?: string;
+}
+export declare function runReplayGenerationBenchmarkCommand(options: ReplayGenerationBenchmarkCommandOptions): Promise<number>;
 export declare function runInitGenerationSessionCommand(options: InitGenerationSessionCommandOptions): Promise<number>;
 export declare function runPrepareGenerationHandoffCommand(options: PrepareGenerationHandoffCommandOptions): Promise<number>;
 export declare function runRecordGenerationAttemptCommand(options: RecordGenerationAttemptCommandOptions): Promise<number>;
diff --git a/packages/interfacectl-cli/dist/commands/generation-session.d.ts.map b/packages/interfacectl-cli/dist/commands/generation-session.d.ts.map
index 77aaf71..5257f5b 100644
--- a/packages/interfacectl-cli/dist/commands/generation-session.d.ts.map
+++ b/packages/interfacectl-cli/dist/commands/generation-session.d.ts.map
@@ -1 +1 @@
-{"version":3,"file":"generation-session.d.ts","sourceRoot":"","sources":["../../src/commands/generation-session.ts"],"names":[],"mappings":"AA8BA,MAAM,WAAW,mCAAmC;IAClD,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,IAAI,CAAC,EAAE,MAAM,CAAC;IACd,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,gBAAgB,CAAC,EAAE,MAAM,CAAC;IAC1B,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,SAAS,CAAC,EAAE,MAAM,CAAC;CACpB;AAED,MAAM,WAAW,sCAAsC;IACrD,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,gBAAgB,CAAC,EAAE,MAAM,CAAC;IAC1B,uBAAuB,CAAC,EAAE,MAAM,CAAC;IACjC,iBAAiB,CAAC,EAAE,MAAM,CAAC;IAC3B,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,OAAO,CAAC,EAAE,MAAM,CAAC;CAClB;AAED,MAAM,WAAW,qCAAqC;IACpD,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,cAAc,CAAC,EAAE,MAAM,CAAC;CACzB;AAED,MAAM,WAAW,sCAAsC;IACrD,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,aAAa,CAAC,EAAE,MAAM,GAAG,MAAM,CAAC;IAChC,GAAG,CAAC,EAAE,MAAM,CAAC;IACb,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,gBAAgB,CAAC,EAAE,MAAM,CAAC;CAC3B;AAED,MAAM,WAAW,qCAAqC;IACpD,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,aAAa,CAAC,EAAE,MAAM,GAAG,MAAM,CAAC;IAChC,UAAU,CAAC,EAAE,MAAM,CAAC;CACrB;AAED,MAAM,WAAW,wCAAwC;IACvD,UAAU,CAAC,EAAE,MAAM,CAAC;CACrB;AAED,MAAM,WAAW,uCAAuC;IACtD,kBAAkB,CAAC,EAAE,MAAM,CAAC;IAC5B,gBAAgB,CAAC,EAAE,MAAM,CAAC;IAC1B,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB;AAED,MAAM,WAAW,mCAAmC;IAClD,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,OAAO,CAAC,EAAE,MAAM,CAAC;CAClB;AAED,MAAM,WAAW,4CAA4C;IAC3D,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,OAAO,CAAC,EAAE,MAAM,CAAC;CAClB;AAED,MAAM,WAAW,0CAA0C;IACzD,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB;AAqhED,wBAAsB,+BAA+B,CACnD,OAAO,EAAE,mCAAmC,GAC3C,OAAO,CAAC,MAAM,CAAC,CA8EjB;AAED,wBAAsB,kCAAkC,CACtD,OAAO,EAAE,sCAAsC,GAC9C,OAAO,CAAC,MAAM,CAAC,CA6DjB;AAED,wBAAsB,iCAAiC,CACrD,OAAO,EAAE,qCAAqC,GAC7C,OAAO,CAAC,MAAM,CAAC,CA+FjB;AAED,wBAAsB,kCAAkC,CACtD,OAAO,EAAE,sCAAsC,GAC9C,OAAO,CAAC,MAAM,CAAC,CA0GjB;AAED,wBAAsB,iCAAiC,CACrD,OAAO,EAAE,qCAAqC,GAC7C,OAAO,CAAC,MAAM,CAAC,CAuEjB;AAED,wBAAsB,oCAAoC,CAC
xD,OAAO,EAAE,wCAAwC,GAChD,OAAO,CAAC,MAAM,CAAC,CAmBjB;AAED,wBAAsB,mCAAmC,CACvD,OAAO,EAAE,uCAAuC,GAC/C,OAAO,CAAC,MAAM,CAAC,CA4CjB;AAED,wBAAsB,+BAA+B,CACnD,OAAO,EAAE,mCAAmC,GAC3C,OAAO,CAAC,MAAM,CAAC,CAuCjB;AAED,wBAAsB,wCAAwC,CAC5D,OAAO,EAAE,4CAA4C,GACpD,OAAO,CAAC,MAAM,CAAC,CA8EjB;AAED,wBAAsB,sCAAsC,CAC1D,OAAO,EAAE,0CAA0C,GAClD,OAAO,CAAC,MAAM,CAAC,CAuIjB"}
\ No newline at end of file
+{"version":3,"file":"generation-session.d.ts","sourceRoot":"","sources":["../../src/commands/generation-session.ts"],"names":[],"mappings":"AAuCA,MAAM,WAAW,mCAAmC;IAClD,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,IAAI,CAAC,EAAE,MAAM,CAAC;IACd,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,gBAAgB,CAAC,EAAE,MAAM,CAAC;IAC1B,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,SAAS,CAAC,EAAE,MAAM,CAAC;CACpB;AAED,MAAM,WAAW,sCAAsC;IACrD,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,gBAAgB,CAAC,EAAE,MAAM,CAAC;IAC1B,uBAAuB,CAAC,EAAE,MAAM,CAAC;IACjC,iBAAiB,CAAC,EAAE,MAAM,CAAC;IAC3B,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,OAAO,CAAC,EAAE,MAAM,CAAC;CAClB;AAED,MAAM,WAAW,qCAAqC;IACpD,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,cAAc,CAAC,EAAE,MAAM,CAAC;CACzB;AAED,MAAM,WAAW,sCAAsC;IACrD,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,aAAa,CAAC,EAAE,MAAM,GAAG,MAAM,CAAC;IAChC,GAAG,CAAC,EAAE,MAAM,CAAC;IACb,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,gBAAgB,CAAC,EAAE,MAAM,CAAC;CAC3B;AAED,MAAM,WAAW,qCAAqC;IACpD,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,aAAa,CAAC,EAAE,MAAM,GAAG,MAAM,CAAC;IAChC,UAAU,CAAC,EAAE,MAAM,CAAC;CACrB;AAED,MAAM,WAAW,wCAAwC;IACvD,UAAU,CAAC,EAAE,MAAM,CAAC;CACrB;AAED,MAAM,WAAW,uCAAuC;IACtD,kBAAkB,CAAC,EAAE,MAAM,CAAC;IAC5B,gBAAgB,CAAC,EAAE,MAAM,CAAC;IAC1B,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB;AAED,MAAM,WAAW,mCAAmC;IAClD,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,OAAO,CAAC,EAAE,MAAM,CAAC;CAClB;AAED,MAAM,WAAW,4CAA4C;IAC3D,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,OAAO,CAAC,EAAE,MAAM,CAAC;CAClB;AAED,MAAM,WAAW,0CAA0C;IACzD,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,OAAO,CAAC,EAAE,MAAM,CAAC;CAClB;AAED,MAAM,WAAW,uCAAuC;IACtD,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,IAAI,CAAC,EAAE,MAAM,CAAC;IACd,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,mBAAmB,CAAC,EAAE,MAAM,CAAC;IAC7B,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,WAAW,CAAC,EAAE,MAAM,CAAC;CACtB;AAw+ED,wBAAsB,mCAAmC,CACvD,OAAO,EAAE,uCAAuC,GAC/C,OAAO,CAAC,
MAAM,CAAC,CAgFjB;AAED,wBAAsB,+BAA+B,CACnD,OAAO,EAAE,mCAAmC,GAC3C,OAAO,CAAC,MAAM,CAAC,CA8EjB;AAED,wBAAsB,kCAAkC,CACtD,OAAO,EAAE,sCAAsC,GAC9C,OAAO,CAAC,MAAM,CAAC,CA6DjB;AAED,wBAAsB,iCAAiC,CACrD,OAAO,EAAE,qCAAqC,GAC7C,OAAO,CAAC,MAAM,CAAC,CA+FjB;AAED,wBAAsB,kCAAkC,CACtD,OAAO,EAAE,sCAAsC,GAC9C,OAAO,CAAC,MAAM,CAAC,CA0GjB;AAED,wBAAsB,iCAAiC,CACrD,OAAO,EAAE,qCAAqC,GAC7C,OAAO,CAAC,MAAM,CAAC,CAuEjB;AAED,wBAAsB,oCAAoC,CACxD,OAAO,EAAE,wCAAwC,GAChD,OAAO,CAAC,MAAM,CAAC,CAmBjB;AAED,wBAAsB,mCAAmC,CACvD,OAAO,EAAE,uCAAuC,GAC/C,OAAO,CAAC,MAAM,CAAC,CA4CjB;AAED,wBAAsB,+BAA+B,CACnD,OAAO,EAAE,mCAAmC,GAC3C,OAAO,CAAC,MAAM,CAAC,CAuCjB;AAED,wBAAsB,wCAAwC,CAC5D,OAAO,EAAE,4CAA4C,GACpD,OAAO,CAAC,MAAM,CAAC,CA8EjB;AAED,wBAAsB,sCAAsC,CAC1D,OAAO,EAAE,0CAA0C,GAClD,OAAO,CAAC,MAAM,CAAC,CA8QjB"}
\ No newline at end of file
diff --git a/packages/interfacectl-cli/dist/commands/generation-session.js b/packages/interfacectl-cli/dist/commands/generation-session.js
index 1fdd7ae..6916605 100644
--- a/packages/interfacectl-cli/dist/commands/generation-session.js
+++ b/packages/interfacectl-cli/dist/commands/generation-session.js
@@ -9,16 +9,20 @@ import { emitContractRunArtifact, } from "../utils/run-artifacts.js";
 import { writeDeterministicJsonSync } from "../utils/deterministic-json.js";
 const VALID_TOOLS = new Set(["codex", "cursor", "local-llm"]);
 const VALID_GRADES = new Set(["strong", "partial", "weak"]);
-const VALID_GUIDANCE_STRATEGIES = new Set(["prompt-summary", "json-primary", "unguided"]);
+const VALID_GUIDANCE_STRATEGIES = new Set(["prompt-summary", "baseline-primary", "json-primary", "unguided"]);
 const VALID_REVIEW_STATUSES = new Set(["accepted", "rejected"]);
 const VALID_SUGGESTION_STATUSES = new Set(["proposed", "accepted", "rejected"]);
 const VALID_SUCCESS_RULES = new Set(["pass", "pass-or-reviewed-warn"]);
+const VALID_EVALUATION_MODES = new Set(["zero-shot", "iterative"]);
+const VALID_PLATFORM_TARGETS = new Set(["web", "ios", "android"]);
+const VALID_CONSUMER_TYPES = new Set(["web-browser", "desktop-shell", "ios-native", "android-native"]);
 const ASSESSMENT_DIMENSIONS = [
     "structure",
     "components",
     "boundary",
     "visual",
     "responsiveness",
+    "platformFit",
 ];
 class SessionInputError extends Error {
     code;
@@ -79,10 +83,31 @@ function ensureGuidanceStrategy(guidanceStrategy) {
     const normalized = typeof guidanceStrategy === "string" ? guidanceStrategy.trim().toLowerCase() : "prompt-summary";
     const mapped = normalized === "prepared" ? "prompt-summary" : normalized;
     if (!VALID_GUIDANCE_STRATEGIES.has(mapped)) {
-        throw new SessionInputError(`Invalid guidance strategy "${guidanceStrategy ?? ""}". Expected prompt-summary|json-primary|unguided.`);
+        throw new SessionInputError(`Invalid guidance strategy "${guidanceStrategy ?? ""}". Expected prompt-summary|baseline-primary|json-primary|unguided.`);
     }
     return mapped;
 }
+function ensureEvaluationMode(value) {
+    const normalized = typeof value === "string" ? value.trim().toLowerCase() : "zero-shot";
+    if (!VALID_EVALUATION_MODES.has(normalized)) {
+        throw new SessionInputError(`Invalid evaluation mode "${value ?? ""}". Expected zero-shot|iterative.`);
+    }
+    return normalized;
+}
+function ensurePlatformTarget(value, label) {
+    const normalized = typeof value === "string" ? value.trim().toLowerCase() : "";
+    if (!VALID_PLATFORM_TARGETS.has(normalized)) {
+        throw new SessionInputError(`Invalid ${label} "${String(value ?? "")}". Expected web|ios|android.`);
+    }
+    return normalized;
+}
+function ensureConsumerType(value, label) {
+    const normalized = typeof value === "string" ? value.trim().toLowerCase() : "";
+    if (!VALID_CONSUMER_TYPES.has(normalized)) {
+        throw new SessionInputError(`Invalid ${label} "${String(value ?? "")}". Expected web-browser|desktop-shell|ios-native|android-native.`);
+    }
+    return normalized;
+}
 function buildDefaultSessionId() {
     return new Date().toISOString().replace(/[-:]/g, "").replace(/\.\d{3}Z$/, "Z");
 }
@@ -121,7 +146,9 @@ function normalizeAssessment(payload, filePath, options = {}) {
     const structureFallback = payload.structure;
     const grade = (key) => {
         let value = payload[key];
-        if (value === undefined && options.allowLegacyMissing && (key === "components" || key === "boundary")) {
+        if (value === undefined
+            && options.allowLegacyMissing
+            && (key === "components" || key === "boundary" || key === "platformFit")) {
             value = structureFallback;
         }
         if (!VALID_GRADES.has(value)) {
@@ -175,6 +202,7 @@ function normalizeAssessment(payload, filePath, options = {}) {
         boundary: grade("boundary"),
         visual: grade("visual"),
         responsiveness: grade("responsiveness"),
+        platformFit: grade("platformFit"),
         notes,
         ...(touchedFiles && touchedFiles.length > 0 ? { touchedFiles } : {}),
         ...(heuristics ? { heuristics } : {}),
@@ -457,6 +485,22 @@ function averageNullable(values) {
     }
     return Math.round((filtered.reduce((sum, value) => sum + value, 0) / filtered.length) * 1000) / 1000;
 }
+function readOptionalTrimmedText(filePath) {
+    if (!filePath || !fs.existsSync(filePath)) {
+        return null;
+    }
+    return fs.readFileSync(filePath, "utf8").trim();
+}
+function appendArtifactLines(lines, title, artifacts) {
+    const filtered = artifacts.filter(([, filePath]) => Boolean(filePath));
+    if (filtered.length === 0) {
+        return;
+    }
+    lines.push("", title);
+    for (const [label, filePath] of filtered) {
+        lines.push(`- ${label}: ${filePath}`);
+    }
+}
 function renderSummaryMarkdown(summary) {
     const lines = [
         "# Generation Session Summary",
@@ -496,6 +540,7 @@ function renderSummaryMarkdown(summary) {
     lines.push(`- boundary: ${summary.latestAssessment?.boundary ?? "n/a"}`);
     lines.push(`- visual: ${summary.latestAssessment?.visual ?? "n/a"}`);
     lines.push(`- responsiveness: ${summary.latestAssessment?.responsiveness ?? "n/a"}`);
+    lines.push(`- platform fit: ${summary.latestAssessment?.platformFit ?? "n/a"}`);
     lines.push(`- notes: ${summary.latestAssessment?.notes ?? "n/a"}`);
     if (summary.latestAssessment?.touchedFiles?.length) {
         lines.push(`- touched files: ${summary.latestAssessment.touchedFiles.join(", ")}`);
@@ -785,11 +830,24 @@ function renderSuggestionsMarkdown(artifact) {
     }
     return `${lines.join("\n")}\n`;
 }
-function renderBenchmarkReportMarkdown(report) {
+function renderBenchmarkReportMarkdown(report, run) {
     const lines = [
         "# Generation Benchmark Report",
         "",
         `Generated at: ${report.generatedAt}`,
+        ...(report.run
+            ? [
+                `Cohort: ${report.run.cohortId}`,
+                `Evaluation mode: ${report.run.evaluationMode}`,
+                `Tool: ${report.run.tool}`,
+                `Model label: ${report.run.model.requestedModelLabel ?? "not recorded"}`,
+                `Resolved model id: ${report.run.model.resolvedModelId ?? "not recorded"}`,
+                `Base URL: ${report.run.model.baseUrl ?? "not recorded"}`,
+                `Fingerprint: ${report.run.model.fingerprint ?? "not recorded"}`,
+                `Source spec: ${report.run.sourceSpecPath}`,
+                `Source run: ${report.run.sourceRunPath ?? "none"}`,
+            ]
+            : []),
         `Surfaces: ${report.overall.surfaceCount}`,
         `Surfaces meeting goal: ${report.overall.surfacesMeetingGoal}`,
         `Candidate fewer first-attempt blocking findings: ${report.overall.guidedFewerFirstAttemptBlockingFindings}`,
@@ -797,8 +855,13 @@ function renderBenchmarkReportMarkdown(report) {
         "",
         "## Comparisons",
     ];
-    for (const comparison of report.comparisons) {
-        lines.push(`- ${comparison.surfaceId}: baseline=${comparison.baselineGuidanceStrategy}, candidate=${comparison.guidedGuidanceStrategy}, meetsGoal=${comparison.meetsGoal}, improved dimensions=${comparison.guidedRubricBetterDimensions.join(", ") || "none"}`);
+    if (report.comparisons.length === 0) {
+        lines.push("- none");
+    }
+    else {
+        for (const comparison of report.comparisons) {
+            lines.push(`- ${comparison.surfaceId}: baseline=${comparison.baselineGuidanceStrategy}, candidate=${comparison.guidedGuidanceStrategy}, platform=${comparison.platformTarget ?? "unknown"}, consumer=${comparison.consumerType ?? "unknown"}, model=${comparison.modelLabel ?? "unknown"}, meetsGoal=${comparison.meetsGoal}, improved dimensions=${comparison.guidedRubricBetterDimensions.join(", ") || "none"}`);
+        }
     }
     lines.push("", "## Suggestion decisions");
     for (const suggestion of report.suggestions) {
@@ -811,6 +874,65 @@ function renderBenchmarkReportMarkdown(report) {
     lines.push(`- lower touched files per resolved finding: ${report.overall.heuristics.lowerTouchedFilesPerResolvedFinding}`);
     lines.push(`- lower repeated finding carryover count: ${report.overall.heuristics.lowerRepeatedFindingCarryoverCount}`);
     lines.push(`- lower reruns to acceptable outcome: ${report.overall.heuristics.lowerRerunsToAcceptableOutcome}`);
+    if (report.breakdowns) {
+        const renderBreakdownBlock = (title, entries) => {
+            lines.push("", title);
+            const keys = Object.keys(entries).sort((left, right) => left.localeCompare(right));
+            if (keys.length === 0) {
+                lines.push("- none");
+                return;
+            }
+            for (const key of keys) {
+                const entry = entries[key];
+                lines.push(`- ${key}: comparisons=${entry.comparisonCount}, surfaces=${entry.surfaceCount}, meetsGoal=${entry.surfacesMeetingGoal}, fewerBlocking=${entry.guidedFewerFirstAttemptBlockingFindings}, acceptableNoLater=${entry.guidedReachedAcceptableNoLater}`);
+            }
+        };
+        renderBreakdownBlock("## By Platform Target", report.breakdowns.byPlatformTarget);
+        renderBreakdownBlock("## By Consumer Type", report.breakdowns.byConsumerType);
+        renderBreakdownBlock("## By Model", report.breakdowns.byModelLabel);
+    }
+    if (run) {
+        lines.push("", "## Zero-Shot Evidence");
+        for (const fixture of run.fixtures) {
+            lines.push("", `### ${fixture.surfaceId}`, `- fixture: ${fixture.fixtureId}`, `- platform target: ${fixture.platformTarget}`, `- consumer type: ${fixture.consumerType}`, `- capture preset: ${fixture.capturePreset}`, `- brief path: ${fixture.brief.path}`, `- brief sha256: ${fixture.brief.sha256}`);
+            const briefText = readOptionalTrimmedText(fixture.brief.path);
+            if (briefText) {
+                lines.push("", "#### Benchmark Brief", "", "```md", briefText, "```");
+            }
+            appendArtifactLines(lines, "#### Contract Artifacts", [
+                ["source contract", fixture.paths?.sourceContractPath],
+                ["source AST", fixture.paths?.sourceAstPath],
+                ["bundle root", fixture.paths?.bundleRoot],
+                ["compiled contract", fixture.paths?.compiledContractPath],
+                ["effective AST", fixture.paths?.effectiveAstPath],
+            ]);
+            appendArtifactLines(lines, "#### Prompt And Input Artifacts", [
+                ["prepared input", fixture.paths?.preparedInputPath],
+                ["accepted suggestions", fixture.paths?.acceptedSuggestionsPath],
+                ["designer notes", fixture.paths?.designerNotesPath],
+                ["baseline validate", fixture.paths?.baselineValidatePath],
+            ]);
+            if (fixture.comparisons.length > 0) {
+                lines.push("", "#### Fixture Comparisons");
+                for (const comparison of fixture.comparisons) {
+                    lines.push(`- ${comparison.baselineGuidanceStrategy} vs ${comparison.guidedGuidanceStrategy}: ${comparison.comparisonPath}`);
+                }
+            }
+            if (fixture.sessions.length > 0) {
+                lines.push("", "#### Session Evidence");
+                for (const session of fixture.sessions) {
+                    const summary = fs.existsSync(session.summaryPath)
+                        ? readJsonFile(session.summaryPath, "generation benchmark session summary")
+                        : null;
+                    lines.push("", `##### ${session.guidanceStrategy}`, `- session id: ${session.sessionId}`, `- session dir: ${session.sessionDir}`, `- latest status: ${asString(summary?.latestStatus) ?? "not recorded"}`, `- latest outcome: ${asString(summary?.latestOutcome) ?? "not recorded"}`, `- error: ${asString(summary?.errorMessage) ?? "none"}`, `- summary path: ${session.summaryPath}`, `- guidance handoff: ${session.guidanceHandoffPath}`, `- agent input: ${session.agentInputPath}`, `- preview: ${session.previewPath ?? "not captured"}`);
+                    const agentInput = readOptionalTrimmedText(session.agentInputPath);
+                    if (agentInput) {
+                        lines.push("", "```txt", agentInput, "```");
+                    }
+                }
+            }
+        }
+    }
     return `${lines.join("\n")}\n`;
 }
 function freezeBriefFile(sessionDir, briefFile) {
@@ -900,6 +1022,35 @@ function buildPreparedPromptSummary(preparedPayload) {
         `Top repair priorities: ${topRepairs.join(", ") || "none"}`,
     ].join("\n");
 }
+function buildBaselinePrimarySummary(preparedPayload) {
+    const surface = asRecord(preparedPayload.surface);
+    const contract = asRecord(preparedPayload.contract);
+    const constraints = asRecord(preparedPayload.constraints);
+    const generation = asRecord(preparedPayload.generation);
+    const layout = asRecord(generation.layout);
+    const guidance = asRecord(generation.guidance);
+    const boundaryRules = Array.isArray(guidance.boundaryRules)
+        ? guidance.boundaryRules.filter((entry) => isRecord(entry))
+        : [];
+    const sections = Array.isArray(preparedPayload.sections)
+        ? preparedPayload.sections.filter((entry) => isRecord(entry))
+        : [];
+    const repairMap = extractRepairEntries(preparedPayload.repairMap);
+    const color = asRecord(constraints.color);
+    const motion = asRecord(constraints.motion);
+    return [
+        `Surface: ${asString(surface.id) ?? "unknown"} (${asString(surface.type) ?? "unspecified"})`,
+        `Contract: ${asString(contract.id) ?? "unknown"} v${asString(contract.version) ?? "0.0.0"}`,
+        `Required sections: ${sections.map((entry) => asString(entry.id) ?? "").filter(Boolean).join(", ") || "none recorded"}`,
+        `Boundary rules: ${boundaryRules.map((entry) => asString(entry.id) ?? "").filter(Boolean).join(", ") || "none recorded"}`,
+        `Max content width: ${typeof layout.maxContentWidth === "number" ? `${layout.maxContentWidth}px` : "unspecified"}`,
+        `Allowed colors: ${asStringArray(color.allowedValues).join(", ") || "none recorded"}`,
+        `Motion durations: ${Array.isArray(motion.allowedDurationsMs)
+            ? motion.allowedDurationsMs.map((value) => `${String(value)}ms`).join(", ")
+            : "none recorded"}`,
+        `Top repair codes: ${repairMap.slice(0, 5).map((entry) => asString(entry.code) ?? "").filter(Boolean).join(", ") || "none"}`,
+    ].join("\n");
+}
 function selectRelevantComponents(preparedPayload) {
     const sections = Array.isArray(preparedPayload.sections)
         ? preparedPayload.sections.filter((entry) => isRecord(entry))
@@ -1064,6 +1215,12 @@ function buildGuidanceHandoff(session, paths, guidanceStrategy, options = {}) {
                 preparedGuidanceSummary: buildPreparedPromptSummary(preparedPayload),
             }
             : null,
+        baselinePrimary: guidanceStrategy === "baseline-primary"
+            ? {
+                effectiveContractSummary: summarizeContractForSurface(session.contractPath, session.surfaceId),
+                baselineContractSummary: buildBaselinePrimarySummary(preparedPayload),
+            }
+            : null,
         jsonPrimary: guidanceStrategy === "json-primary"
             ? {
                 surface: asRecord(preparedPayload.surface),
@@ -1398,6 +1555,200 @@ function normalizeSuggestionReviewFile(filePath) {
         };
     });
 }
+function buildDefaultBenchmarkCohortId() {
+    return new Date().toISOString().replace(/[-:.TZ]/g, "").slice(0, 14);
+}
+function normalizeBenchmarkComparisonPairs(value, label) {
+    if (!Array.isArray(value) || value.length === 0) {
+        throw new SessionInputError(`${label} must be a non-empty array.`);
+    }
+    return value.map((entry, index) => {
+        const record = asRecord(entry);
+        return {
+            baselineGuidanceStrategy: ensureGuidanceStrategy(asString(record.baselineGuidanceStrategy) ?? (() => {
+                throw new SessionInputError(`${label}[${index}].baselineGuidanceStrategy is required.`);
+            })()),
+            guidedGuidanceStrategy: ensureGuidanceStrategy(asString(record.guidedGuidanceStrategy) ?? (() => {
+                throw new SessionInputError(`${label}[${index}].guidedGuidanceStrategy is required.`);
+            })()),
+        };
+    });
+}
+function loadGenerationBenchmarkSpec(specPath) {
+    const resolvedPath = path.resolve(specPath);
+    const payload = readJsonFile(resolvedPath, "generation benchmark spec");
+    const fixturesValue = payload.fixtures;
+    if (!Array.isArray(fixturesValue) || fixturesValue.length === 0) {
+        throw new SessionInputError(`Benchmark spec must include a non-empty fixtures array: ${resolvedPath}.`);
+    }
+    const guidanceStrategies = asStringArray(payload.guidanceStrategies).map((entry) => ensureGuidanceStrategy(entry));
+    if (guidanceStrategies.length < 2) {
+        throw new SessionInputError(`Benchmark spec must freeze at least two guidance strategies: ${resolvedPath}.`);
+    }
+    const comparisonPairs = normalizeBenchmarkComparisonPairs(payload.comparisonPairs, "comparisonPairs");
+    const attemptBudget = Number(payload.attemptBudget);
+    if (!Number.isInteger(attemptBudget) || attemptBudget < 1) {
+        throw new SessionInputError(`Benchmark spec attemptBudget must be a positive integer: ${resolvedPath}.`);
+    }
+    return {
+        schemaVersion: 1,
+        specId: asString(payload.specId) ?? path.basename(resolvedPath, path.extname(resolvedPath)),
+        generatedAt: asString(payload.generatedAt) ?? new Date().toISOString(),
+        evaluationMode: ensureEvaluationMode(asString(payload.evaluationMode) ?? "zero-shot"),
+        attemptBudget,
+        guidanceStrategies,
+        comparisonPairs,
+        ...(asString(payload.suiteId) ? { suiteId: asString(payload.suiteId) ?? undefined } : {}),
+        ...(asString(payload.suiteName) ? { suiteName: asString(payload.suiteName) ?? undefined } : {}),
+        fixtures: fixturesValue.map((entry, index) => {
+            const record = asRecord(entry);
+            const brief = asRecord(record.brief);
+            const pathsRecord = record.paths !== undefined ? asRecord(record.paths) : null;
+            const fixtureComparisonPairs = record.comparisonPairs !== undefined
+                ? normalizeBenchmarkComparisonPairs(record.comparisonPairs, `fixtures[${index}].comparisonPairs`)
+                : comparisonPairs;
+            return {
+                fixtureId: asString(record.fixtureId) ?? (() => {
+                    throw new SessionInputError(`fixtures[${index}].fixtureId is required in ${resolvedPath}.`);
+                })(),
+                surfaceId: asString(record.surfaceId) ?? (() => {
+                    throw new SessionInputError(`fixtures[${index}].surfaceId is required in ${resolvedPath}.`);
+                })(),
+                brief: {
+                    path: asString(brief.path) ?? (() => {
+                        throw new SessionInputError(`fixtures[${index}].brief.path is required in ${resolvedPath}.`);
+                    })(),
+                    sha256: asString(brief.sha256) ?? (() => {
+                        throw new SessionInputError(`fixtures[${index}].brief.sha256 is required in ${resolvedPath}.`);
+                    })(),
+                },
+                platformTarget: ensurePlatformTarget(record.platformTarget, `fixtures[${index}].platformTarget`),
+                consumerType: ensureConsumerType(record.consumerType, `fixtures[${index}].consumerType`),
+                capturePreset: asString(record.capturePreset) ?? "web-browser",
+                comparisonPairs: fixtureComparisonPairs,
+                ...(pathsRecord
+                    ? {
+                        paths: {
+                            ...(asString(pathsRecord.fixtureDir) ? { fixtureDir: asString(pathsRecord.fixtureDir) ?? undefined } : {}),
+                            ...(asString(pathsRecord.sourceContractPath)
+                                ? { sourceContractPath: asString(pathsRecord.sourceContractPath) ?? undefined }
+                                : {}),
+                            ...(asString(pathsRecord.sourceAstPath)
+                                ? { sourceAstPath: asString(pathsRecord.sourceAstPath) ?? undefined }
+                                : {}),
+                            ...(asString(pathsRecord.bundleRoot)
+                                ? { bundleRoot: asString(pathsRecord.bundleRoot) ?? undefined }
+                                : {}),
+                            ...(asString(pathsRecord.compiledContractPath)
+                                ? { compiledContractPath: asString(pathsRecord.compiledContractPath) ?? undefined }
+                                : {}),
+                            ...(asString(pathsRecord.effectiveAstPath)
+                                ? { effectiveAstPath: asString(pathsRecord.effectiveAstPath) ?? undefined }
+                                : {}),
+                            ...(asString(pathsRecord.preparedInputPath)
+                                ? { preparedInputPath: asString(pathsRecord.preparedInputPath) ?? undefined }
+                                : {}),
+                            ...(asString(pathsRecord.acceptedSuggestionsPath)
+                                ? { acceptedSuggestionsPath: asString(pathsRecord.acceptedSuggestionsPath) ?? undefined }
+                                : {}),
+                            ...(asString(pathsRecord.designerNotesPath)
+                                ? { designerNotesPath: asString(pathsRecord.designerNotesPath) ?? undefined }
+                                : {}),
+                            ...(asString(pathsRecord.baselineValidatePath)
+                                ? { baselineValidatePath: asString(pathsRecord.baselineValidatePath) ?? undefined }
+                                : {}),
+                        },
+                    }
+                    : {}),
+            };
+        }),
+    };
+}
+function loadGenerationBenchmarkRun(runPath) {
+    return readJsonFile(path.resolve(runPath), "generation benchmark run");
+}
+function buildBreakdownSummary(entries) {
+    return {
+        comparisonCount: entries.length,
+        surfaceCount: new Set(entries.map((entry) => entry.surfaceId)).size,
+        surfacesMeetingGoal: entries.filter((entry) => entry.meetsGoal).length,
+        guidedFewerFirstAttemptBlockingFindings: entries.filter((entry) => entry.guidedFewerFirstAttemptBlockingFindings).length,
+        guidedReachedAcceptableNoLater: entries.filter((entry) => entry.guidedReachedAcceptableNoLater).length,
+    };
+}
+export async function runReplayGenerationBenchmarkCommand(options) {
+    try {
+        if (!options.specPath) {
+            throw new SessionInputError("--spec is required.");
+        }
+        if (!options.outDir) {
+            throw new SessionInputError("--out-dir is required.");
+        }
+        const tool = ensureSessionTool(options.tool);
+        const specPath = path.resolve(options.specPath);
+        const spec = loadGenerationBenchmarkSpec(specPath);
+        const benchmarkDir = path.resolve(options.outDir);
+        const cohortId = options.cohortId?.trim() || buildDefaultBenchmarkCohortId();
+        const runPath = path.join(benchmarkDir, "run.json");
+        const copiedSpecPath = path.join(benchmarkDir, "spec.json");
+        const sourceRunPath = options.sourceRunPath ? path.resolve(options.sourceRunPath) : null;
+        fs.mkdirSync(benchmarkDir, { recursive: true });
+        if (path.resolve(specPath) !== path.resolve(copiedSpecPath)) {
+            fs.copyFileSync(specPath, copiedSpecPath);
+        }
+        const run = {
+            schemaVersion: 1,
+            cohortId,
+            generatedAt: new Date().toISOString(),
+            evaluationMode: spec.evaluationMode,
+            tool,
+            sourceSpecPath: specPath,
+            sourceRunPath,
+            attemptBudget: spec.attemptBudget,
+            guidanceStrategies: [...spec.guidanceStrategies],
+            comparisonPairs: spec.comparisonPairs.map((pair) => ({ ...pair })),
+            model: {
+                requestedModelLabel: options.requestedModelLabel?.trim() || null,
+                resolvedModelId: options.resolvedModelId?.trim() || null,
+                baseUrl: options.baseUrl?.trim() || null,
+                fingerprint: options.fingerprint?.trim() || null,
+            },
+            ...(spec.suiteId ? { suiteId: spec.suiteId } : {}),
+            ...(spec.suiteName ? { suiteName: spec.suiteName } : {}),
+            paths: {
+                benchmarkDir,
+                specPath: copiedSpecPath,
+                runPath,
+                reportJsonPath: null,
+                reportMarkdownPath: null,
+            },
+            fixtures: spec.fixtures.map((fixture) => ({
+                ...fixture,
+                sessions: [],
+                comparisons: [],
+            })),
+        };
+        writeDeterministicJsonSync(runPath, run);
+        process.stdout.write(`${JSON.stringify({
+            ok: true,
+            run,
+            paths: {
+                specPath: copiedSpecPath,
+                runPath,
+                benchmarkDir,
+            },
+        }, null, 2)}\n`);
+        return 0;
+    }
+    catch (error) {
+        if (error instanceof SessionInputError || error instanceof AdapterInputError) {
+            writeError(error, error.code);
+            return 10;
+        }
+        writeError(error instanceof Error ? error : new Error(String(error)), "generation-session.internal");
+        return 1;
+    }
+}
 export async function runInitGenerationSessionCommand(options) {
     try {
         if (!options.bundleRoot) {
@@ -1925,8 +2276,12 @@ export async function runReviewContractDeltaSuggestionsCommand(options) {
 }
 export async function runSummarizeGenerationBenchmarkCommand(options) {
     try {
+        const run = options.runPath ? loadGenerationBenchmarkRun(options.runPath) : null;
         const comparisonPaths = parseCsvPaths(options.comparisonPaths);
-        if (comparisonPaths.length === 0) {
+        if (comparisonPaths.length === 0 && run) {
+            comparisonPaths.push(...run.fixtures.flatMap((fixture) => fixture.comparisons.map((comparison) => path.resolve(comparison.comparisonPath))));
+        }
+        if (comparisonPaths.length === 0 && !run) {
             throw new SessionInputError("--comparisons must include at least one comparison artifact path.");
         }
         const suggestionPaths = parseCsvPaths(options.suggestionPaths);
@@ -1938,21 +2293,57 @@ export async function runSummarizeGenerationBenchmarkCommand(options) {
             path: suggestionPath,
             value: readJsonFile(suggestionPath, "contract delta suggestions artifact"),
         }));
+        const fixtureMetadataByComparisonPath = new Map();
+        if (run) {
+            for (const fixture of run.fixtures) {
+                for (const comparison of fixture.comparisons) {
+                    fixtureMetadataByComparisonPath.set(path.resolve(comparison.comparisonPath), {
+                        platformTarget: fixture.platformTarget,
+                        consumerType: fixture.consumerType,
+                    });
+                }
+            }
+        }
         const report = {
-            schemaVersion: 2,
+            schemaVersion: 3,
             generatedAt: new Date().toISOString(),
-            comparisons: comparisons.map(({ path: comparisonPath, value }) => ({
-                surfaceId: value.surfaceId,
-                tool: value.tool,
-                comparisonPath,
-                meetsGoal: value.checks.meetsGoal,
-                baselineGuidanceStrategy: value.baseline.guidanceStrategy,
-                guidedGuidanceStrategy: value.guided.guidanceStrategy,
-                guidedFewerFirstAttemptBlockingFindings: value.checks.guidedFewerFirstAttemptBlockingFindings,
-                guidedReachedAcceptableNoLater: value.checks.guidedReachedAcceptableNoLater,
-                guidedRubricBetterDimensions: value.checks.guidedRubricBetterDimensions,
-                heuristics: value.heuristics.delta,
-            })),
+            ...(run
+                ? {
+                    run: {
+                        cohortId: run.cohortId,
+                        evaluationMode: run.evaluationMode,
+                        tool: run.tool,
+                        sourceSpecPath: run.sourceSpecPath,
+                        sourceRunPath: run.sourceRunPath,
+                        guidanceStrategies: [...run.guidanceStrategies],
+                        attemptBudget: run.attemptBudget,
+                        model: {
+                            requestedModelLabel: run.model.requestedModelLabel,
+                            resolvedModelId: run.model.resolvedModelId,
+                            baseUrl: run.model.baseUrl,
+                            fingerprint: run.model.fingerprint,
+                        },
+                    },
+                }
+                : {}),
+            comparisons: comparisons.map(({ path: comparisonPath, value }) => {
+                const comparisonMetadata = fixtureMetadataByComparisonPath.get(path.resolve(comparisonPath));
+                return {
+                    surfaceId: value.surfaceId,
+                    tool: value.tool,
+                    comparisonPath,
+                    meetsGoal: value.checks.meetsGoal,
+                    baselineGuidanceStrategy: value.baseline.guidanceStrategy,
+                    guidedGuidanceStrategy: value.guided.guidanceStrategy,
+                    ...(comparisonMetadata ? { platformTarget: comparisonMetadata.platformTarget } : {}),
+                    ...(comparisonMetadata ? { consumerType: comparisonMetadata.consumerType } : {}),
+                    ...(run ? { modelLabel: run.model.requestedModelLabel ?? run.model.resolvedModelId ?? "unknown" } : {}),
+                    guidedFewerFirstAttemptBlockingFindings: value.checks.guidedFewerFirstAttemptBlockingFindings,
+                    guidedReachedAcceptableNoLater: value.checks.guidedReachedAcceptableNoLater,
+                    guidedRubricBetterDimensions: value.checks.guidedRubricBetterDimensions,
+                    heuristics: value.heuristics.delta,
+                };
+            }),
             suggestions: suggestions.map(({ path: suggestionsPath, value }) => ({
                 surfaceId: value.surfaceId,
                 sessionId: value.sessionId,
@@ -1962,7 +2353,7 @@ export async function runSummarizeGenerationBenchmarkCommand(options) {
                 rejectedCount: value.suggestions.filter((entry) => entry.status === "rejected").length,
             })),
             overall: {
-                surfaceCount: comparisons.length,
+                surfaceCount: comparisons.length > 0 ? comparisons.length : (run?.fixtures.length ?? 0),
                 surfacesMeetingGoal: comparisons.filter(({ value }) => value.checks.meetsGoal).length,
                 guidedFewerFirstAttemptBlockingFindings: comparisons.filter(({ value }) => value.checks.guidedFewerFirstAttemptBlockingFindings).length,
                 guidedReachedAcceptableNoLater: comparisons.filter(({ value }) => value.checks.guidedReachedAcceptableNoLater).length,
@@ -1986,6 +2377,72 @@ export async function runSummarizeGenerationBenchmarkCommand(options) {
                     },
                 },
             },
+            ...(run
+                ? {
+                    breakdowns: {
+                        byPlatformTarget: Object.fromEntries([...new Set(run.fixtures.map((fixture) => fixture.platformTarget))]
+                            .sort((left, right) => left.localeCompare(right))
+                            .map((platformTarget) => [
+                            platformTarget,
+                            buildBreakdownSummary(comparisons
+                                .map(({ path: comparisonPath, value }) => ({
+                                ...value,
+                                __comparisonPath: comparisonPath,
+                            }))
+                                .filter((entry) => fixtureMetadataByComparisonPath.get(path.resolve(entry.__comparisonPath))?.platformTarget === platformTarget)
+                                .map((entry) => ({
+                                surfaceId: entry.surfaceId,
+                                tool: entry.tool,
+                                comparisonPath: entry.__comparisonPath,
+                                meetsGoal: entry.checks.meetsGoal,
+                                baselineGuidanceStrategy: entry.baseline.guidanceStrategy,
+                                guidedGuidanceStrategy: entry.guided.guidanceStrategy,
+                                guidedFewerFirstAttemptBlockingFindings: entry.checks.guidedFewerFirstAttemptBlockingFindings,
+                                guidedReachedAcceptableNoLater: entry.checks.guidedReachedAcceptableNoLater,
+                                guidedRubricBetterDimensions: entry.checks.guidedRubricBetterDimensions,
+                                heuristics: entry.heuristics.delta,
+                            }))),
+                        ])),
+                        byConsumerType: Object.fromEntries([...new Set(run.fixtures.map((fixture) => fixture.consumerType))]
+                            .sort((left, right) => left.localeCompare(right))
+                            .map((consumerType) => [
+                            consumerType,
+                            buildBreakdownSummary(comparisons
+                                .map(({ path: comparisonPath, value }) => ({
+                                ...value,
+                                __comparisonPath: comparisonPath,
+                            }))
+                                .filter((entry) => fixtureMetadataByComparisonPath.get(path.resolve(entry.__comparisonPath))?.consumerType === consumerType)
+                                .map((entry) => ({
+                                surfaceId: entry.surfaceId,
+                                tool: entry.tool,
+                                comparisonPath: entry.__comparisonPath,
+                                meetsGoal: entry.checks.meetsGoal,
+                                baselineGuidanceStrategy: entry.baseline.guidanceStrategy,
+                                guidedGuidanceStrategy: entry.guided.guidanceStrategy,
+                                guidedFewerFirstAttemptBlockingFindings: entry.checks.guidedFewerFirstAttemptBlockingFindings,
+                                guidedReachedAcceptableNoLater: entry.checks.guidedReachedAcceptableNoLater,
+                                guidedRubricBetterDimensions: entry.checks.guidedRubricBetterDimensions,
+                                heuristics: entry.heuristics.delta,
+                            }))),
+                        ])),
+                        byModelLabel: {
+                            [run.model.requestedModelLabel ?? run.model.resolvedModelId ?? "unknown"]: buildBreakdownSummary(comparisons.map(({ path: comparisonPath, value }) => ({
+                                surfaceId: value.surfaceId,
+                                tool: value.tool,
+                                comparisonPath,
+                                meetsGoal: value.checks.meetsGoal,
+                                baselineGuidanceStrategy: value.baseline.guidanceStrategy,
+                                guidedGuidanceStrategy: value.guided.guidanceStrategy,
+                                guidedFewerFirstAttemptBlockingFindings: value.checks.guidedFewerFirstAttemptBlockingFindings,
+                                guidedReachedAcceptableNoLater: value.checks.guidedReachedAcceptableNoLater,
+                                guidedRubricBetterDimensions: value.checks.guidedRubricBetterDimensions,
+                                heuristics: value.heuristics.delta,
+                            }))),
+                        },
+                    },
+                }
+                : {}),
         };
         const outDir = options.outDir
             ? path.resolve(options.outDir)
@@ -1994,7 +2451,17 @@ export async function runSummarizeGenerationBenchmarkCommand(options) {
         const markdownPath = path.join(outDir, "benchmark-report.md");
         writeDeterministicJsonSync(jsonPath, report);
         fs.mkdirSync(path.dirname(markdownPath), { recursive: true });
-        fs.writeFileSync(markdownPath, renderBenchmarkReportMarkdown(report), "utf8");
+        fs.writeFileSync(markdownPath, renderBenchmarkReportMarkdown(report, run), "utf8");
+        if (run && options.runPath) {
+            writeDeterministicJsonSync(path.resolve(options.runPath), {
+                ...run,
+                paths: {
+                    ...run.paths,
+                    reportJsonPath: jsonPath,
+                    reportMarkdownPath: markdownPath,
+                },
+            });
+        }
         process.stdout.write(`${JSON.stringify({
             ok: true,
             report,
diff --git a/packages/interfacectl-cli/dist/index.js b/packages/interfacectl-cli/dist/index.js
index 7de1261..ad21b44 100755
--- a/packages/interfacectl-cli/dist/index.js
+++ b/packages/interfacectl-cli/dist/index.js
@@ -15,7 +15,7 @@ import { runPrepareRuntimeCommand } from "./commands/prepare-runtime.js";
 import { runValidateGenerationCommand } from "./commands/validate-generation.js";
 import { runServeGenerationAdapterCommand } from "./commands/serve-generation-adapter.js";
 import { runEmitRunArtifactCommand } from "./commands/emit-run-artifact.js";
-import { runCaptureGenerationPreviewCommand, runCompareGenerationSessionsCommand, runInitGenerationSessionCommand, runPrepareGenerationHandoffCommand, runRecordGenerationAttemptCommand, runReviewContractDeltaSuggestionsCommand, runReviewGenerationAttemptCommand, runSuggestContractDeltasCommand, runSummarizeGenerationSessionCommand, runSummarizeGenerationBenchmarkCommand, } from "./commands/generation-session.js";
+import { runCaptureGenerationPreviewCommand, runCompareGenerationSessionsCommand, runInitGenerationSessionCommand, runPrepareGenerationHandoffCommand, runReplayGenerationBenchmarkCommand, runRecordGenerationAttemptCommand, runReviewContractDeltaSuggestionsCommand, runReviewGenerationAttemptCommand, runSuggestContractDeltasCommand, runSummarizeGenerationSessionCommand, runSummarizeGenerationBenchmarkCommand, } from "./commands/generation-session.js";
 import { runInitCommand } from "./commands/init.js";
 import { runAnalyzeCommand } from "./commands/analyze.js";
 import { runAuthCaptureCommand, runAuthClearCommand, runAuthListCommandWithOptions, runAuthTestCommand, } from "./commands/auth.js";
@@ -251,7 +251,7 @@ program
     .requiredOption("--surface <id>", "Surface identifier")
     .requiredOption("--workspace-root <path>", "Workspace root for emitted run artifacts")
     .option("--tool <tool>", "Generation tool identifier (codex|cursor|local-llm)")
-    .option("--guidance-strategy <strategy>", "Session guidance strategy (prompt-summary|json-primary|unguided)")
+    .option("--guidance-strategy <strategy>", "Session guidance strategy (prompt-summary|baseline-primary|json-primary|unguided)")
     .option("--guidance-mode <mode>", "Legacy alias for --guidance-strategy (prepared|unguided)")
     .option("--brief-file <path>", "Optional implementation brief file to freeze into the session")
     .option("--session <id>", "Optional session identifier")
@@ -273,7 +273,7 @@ program
     .command("prepare-generation-handoff")
     .description("Build one canonical strategy-aware guidance handoff artifact for a tracked generation session")
     .requiredOption("--session-dir <path>", "Path to the generation session directory")
-    .option("--guidance-strategy <strategy>", "Optional guidance strategy override (prompt-summary|json-primary|unguided)")
+    .option("--guidance-strategy <strategy>", "Optional guidance strategy override (prompt-summary|baseline-primary|json-primary|unguided)")
     .option("--accepted-suggestions <path>", "Optional accepted suggestions JSON file")
     .option("--designer-notes <path>", "Optional designer notes JSON file")
     .option("--finding-codes <codes>", "Optional comma-separated finding codes to match against repair guidance")
@@ -378,16 +378,43 @@ program
 program
     .command("summarize-generation-benchmark")
     .description("Aggregate one or more comparison and suggestion artifacts into a benchmark report")
-    .requiredOption("--comparisons <paths>", "Comma-separated generation session comparison JSON paths")
+    .option("--comparisons <paths>", "Comma-separated generation session comparison JSON paths")
     .option("--suggestions <paths>", "Comma-separated contract delta suggestion JSON paths")
+    .option("--run-path <path>", "Optional benchmark run manifest to enrich the benchmark report")
     .option("--out-dir <path>", "Output directory for the benchmark report")
     .action(async (options) => {
     process.exitCode = await runSummarizeGenerationBenchmarkCommand({
         comparisonPaths: options.comparisons,
         suggestionPaths: options.suggestions,
+        runPath: options.runPath,
         outDir: options.outDir,
     });
 });
+program
+    .command("replay-generation-benchmark")
+    .description("Freeze a benchmark spec into a new replayable benchmark run manifest")
+    .requiredOption("--spec <path>", "Path to the benchmark spec JSON file")
+    .requiredOption("--tool <tool>", "Generation tool identifier (codex|cursor|local-llm)")
+    .requiredOption("--out-dir <path>", "Output directory for the replay run")
+    .option("--cohort-id <id>", "Optional cohort id override")
+    .option("--source-run <path>", "Optional source benchmark run manifest")
+    .option("--requested-model-label <label>", "Optional requested model label")
+    .option("--resolved-model-id <id>", "Optional resolved runtime model id")
+    .option("--base-url <url>", "Optional model base URL")
+    .option("--fingerprint <value>", "Optional model/runtime fingerprint")
+    .action(async (options) => {
+    process.exitCode = await runReplayGenerationBenchmarkCommand({
+        specPath: options.spec,
+        tool: options.tool,
+        outDir: options.outDir,
+        cohortId: options.cohortId,
+        sourceRunPath: options.sourceRun,
+        requestedModelLabel: options.requestedModelLabel,
+        resolvedModelId: options.resolvedModelId,
+        baseUrl: options.baseUrl,
+        fingerprint: options.fingerprint,
+    });
+});
 program
     .command("validate-generation")
     .description("Validate generated UI against a compiled generation bundle")
diff --git a/packages/interfacectl-cli/schemas/contract-delta-suggestions.schema.json b/packages/interfacectl-cli/schemas/contract-delta-suggestions.schema.json
index 6ae46f3..8c69190 100644
--- a/packages/interfacectl-cli/schemas/contract-delta-suggestions.schema.json
+++ b/packages/interfacectl-cli/schemas/contract-delta-suggestions.schema.json
@@ -24,7 +24,7 @@
     },
     "guidanceStrategy": {
       "type": "string",
-      "enum": ["prompt-summary", "json-primary", "unguided"]
+      "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
     },
     "generatedAt": {
       "type": "string",
diff --git a/packages/interfacectl-cli/schemas/generation-assessment.schema.json b/packages/interfacectl-cli/schemas/generation-assessment.schema.json
index b9cf311..7b4d3db 100644
--- a/packages/interfacectl-cli/schemas/generation-assessment.schema.json
+++ b/packages/interfacectl-cli/schemas/generation-assessment.schema.json
@@ -4,7 +4,7 @@
   "title": "GenerationAssessment",
   "type": "object",
   "additionalProperties": false,
-  "required": ["structure", "components", "boundary", "visual", "responsiveness", "notes"],
+  "required": ["structure", "components", "boundary", "visual", "responsiveness", "platformFit", "notes"],
   "properties": {
     "structure": {
       "type": "string",
@@ -26,6 +26,10 @@
       "type": "string",
       "enum": ["strong", "partial", "weak"]
     },
+    "platformFit": {
+      "type": "string",
+      "enum": ["strong", "partial", "weak"]
+    },
     "notes": {
       "type": "string",
       "minLength": 1
diff --git a/packages/interfacectl-cli/schemas/generation-benchmark-report.schema.json b/packages/interfacectl-cli/schemas/generation-benchmark-report.schema.json
index dc5a84a..06b972f 100644
--- a/packages/interfacectl-cli/schemas/generation-benchmark-report.schema.json
+++ b/packages/interfacectl-cli/schemas/generation-benchmark-report.schema.json
@@ -8,12 +8,68 @@
   "properties": {
     "schemaVersion": {
       "type": "number",
-      "const": 2
+      "const": 3
     },
     "generatedAt": {
       "type": "string",
       "format": "date-time"
     },
+    "run": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["cohortId", "evaluationMode", "tool", "sourceSpecPath", "sourceRunPath", "guidanceStrategies", "attemptBudget", "model"],
+      "properties": {
+        "cohortId": {
+          "type": "string",
+          "minLength": 1
+        },
+        "evaluationMode": {
+          "type": "string",
+          "enum": ["zero-shot", "iterative"]
+        },
+        "tool": {
+          "type": "string",
+          "enum": ["codex", "cursor", "local-llm"]
+        },
+        "sourceSpecPath": {
+          "type": "string",
+          "minLength": 1
+        },
+        "sourceRunPath": {
+          "type": ["string", "null"]
+        },
+        "guidanceStrategies": {
+          "type": "array",
+          "items": {
+            "type": "string",
+            "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
+          }
+        },
+        "attemptBudget": {
+          "type": "number",
+          "minimum": 1
+        },
+        "model": {
+          "type": "object",
+          "additionalProperties": false,
+          "required": ["requestedModelLabel", "resolvedModelId", "baseUrl", "fingerprint"],
+          "properties": {
+            "requestedModelLabel": {
+              "type": ["string", "null"]
+            },
+            "resolvedModelId": {
+              "type": ["string", "null"]
+            },
+            "baseUrl": {
+              "type": ["string", "null"]
+            },
+            "fingerprint": {
+              "type": ["string", "null"]
+            }
+          }
+        }
+      }
+    },
     "comparisons": {
       "type": "array",
       "items": {
@@ -44,16 +100,27 @@
             "type": "string",
             "minLength": 1
           },
+          "platformTarget": {
+            "type": "string",
+            "enum": ["web", "ios", "android"]
+          },
+          "consumerType": {
+            "type": "string",
+            "enum": ["web-browser", "desktop-shell", "ios-native", "android-native"]
+          },
+          "modelLabel": {
+            "type": ["string", "null"]
+          },
           "meetsGoal": {
             "type": "boolean"
           },
           "baselineGuidanceStrategy": {
             "type": "string",
-            "enum": ["prompt-summary", "json-primary", "unguided"]
+            "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
           },
           "guidedGuidanceStrategy": {
             "type": "string",
-            "enum": ["prompt-summary", "json-primary", "unguided"]
+            "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
           },
           "guidedFewerFirstAttemptBlockingFindings": {
             "type": "boolean"
@@ -65,7 +132,7 @@
             "type": "array",
             "items": {
               "type": "string",
-              "enum": ["structure", "components", "boundary", "visual", "responsiveness"]
+              "enum": ["structure", "components", "boundary", "visual", "responsiveness", "platformFit"]
             }
           },
           "heuristics": {
@@ -154,6 +221,31 @@
           "$ref": "#/$defs/benchmarkHeuristicsSummary"
         }
       }
+    },
+    "breakdowns": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["byPlatformTarget", "byConsumerType", "byModelLabel"],
+      "properties": {
+        "byPlatformTarget": {
+          "type": "object",
+          "additionalProperties": {
+            "$ref": "#/$defs/breakdownSummary"
+          }
+        },
+        "byConsumerType": {
+          "type": "object",
+          "additionalProperties": {
+            "$ref": "#/$defs/breakdownSummary"
+          }
+        },
+        "byModelLabel": {
+          "type": "object",
+          "additionalProperties": {
+            "$ref": "#/$defs/breakdownSummary"
+          }
+        }
+      }
     }
   },
   "$defs": {
@@ -262,6 +354,39 @@
           "$ref": "#/$defs/benchmarkAverageDelta"
         }
       }
+    },
+    "breakdownSummary": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": [
+        "comparisonCount",
+        "surfaceCount",
+        "surfacesMeetingGoal",
+        "guidedFewerFirstAttemptBlockingFindings",
+        "guidedReachedAcceptableNoLater"
+      ],
+      "properties": {
+        "comparisonCount": {
+          "type": "number",
+          "minimum": 0
+        },
+        "surfaceCount": {
+          "type": "number",
+          "minimum": 0
+        },
+        "surfacesMeetingGoal": {
+          "type": "number",
+          "minimum": 0
+        },
+        "guidedFewerFirstAttemptBlockingFindings": {
+          "type": "number",
+          "minimum": 0
+        },
+        "guidedReachedAcceptableNoLater": {
+          "type": "number",
+          "minimum": 0
+        }
+      }
     }
   }
 }
diff --git a/packages/interfacectl-cli/schemas/generation-benchmark-run.schema.json b/packages/interfacectl-cli/schemas/generation-benchmark-run.schema.json
new file mode 100644
index 0000000..b6b19f6
--- /dev/null
+++ b/packages/interfacectl-cli/schemas/generation-benchmark-run.schema.json
@@ -0,0 +1,235 @@
+{
+  "$schema": "https://json-schema.org/draft/2020-12/schema",
+  "$id": "https://surfaces.dev/schemas/generation-benchmark-run.schema.json",
+  "title": "GenerationBenchmarkRun",
+  "type": "object",
+  "additionalProperties": false,
+  "required": [
+    "schemaVersion",
+    "cohortId",
+    "generatedAt",
+    "evaluationMode",
+    "tool",
+    "sourceSpecPath",
+    "sourceRunPath",
+    "attemptBudget",
+    "guidanceStrategies",
+    "comparisonPairs",
+    "model",
+    "paths",
+    "fixtures"
+  ],
+  "properties": {
+    "schemaVersion": {
+      "type": "number",
+      "const": 1
+    },
+    "cohortId": {
+      "type": "string",
+      "minLength": 1
+    },
+    "generatedAt": {
+      "type": "string",
+      "format": "date-time"
+    },
+    "evaluationMode": {
+      "type": "string",
+      "enum": ["zero-shot", "iterative"]
+    },
+    "tool": {
+      "type": "string",
+      "enum": ["codex", "cursor", "local-llm"]
+    },
+    "sourceSpecPath": {
+      "type": "string",
+      "minLength": 1
+    },
+    "sourceRunPath": {
+      "type": ["string", "null"]
+    },
+    "attemptBudget": {
+      "type": "number",
+      "minimum": 1
+    },
+    "guidanceStrategies": {
+      "type": "array",
+      "items": {
+        "type": "string",
+        "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
+      }
+    },
+    "comparisonPairs": {
+      "type": "array",
+      "items": {
+        "$ref": "#/$defs/comparisonPair"
+      }
+    },
+    "model": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["requestedModelLabel", "resolvedModelId", "baseUrl", "fingerprint"],
+      "properties": {
+        "requestedModelLabel": { "type": ["string", "null"] },
+        "resolvedModelId": { "type": ["string", "null"] },
+        "baseUrl": { "type": ["string", "null"] },
+        "fingerprint": { "type": ["string", "null"] }
+      }
+    },
+    "suiteId": {
+      "type": "string"
+    },
+    "suiteName": {
+      "type": "string"
+    },
+    "paths": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["benchmarkDir", "specPath", "runPath", "reportJsonPath", "reportMarkdownPath"],
+      "properties": {
+        "benchmarkDir": { "type": "string", "minLength": 1 },
+        "specPath": { "type": "string", "minLength": 1 },
+        "runPath": { "type": "string", "minLength": 1 },
+        "reportJsonPath": { "type": ["string", "null"] },
+        "reportMarkdownPath": { "type": ["string", "null"] }
+      }
+    },
+    "fixtures": {
+      "type": "array",
+      "items": {
+        "$ref": "#/$defs/fixture"
+      }
+    }
+  },
+  "$defs": {
+    "comparisonPair": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["baselineGuidanceStrategy", "guidedGuidanceStrategy"],
+      "properties": {
+        "baselineGuidanceStrategy": {
+          "type": "string",
+          "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
+        },
+        "guidedGuidanceStrategy": {
+          "type": "string",
+          "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
+        }
+      }
+    },
+    "brief": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["path", "sha256"],
+      "properties": {
+        "path": { "type": "string", "minLength": 1 },
+        "sha256": { "type": "string", "minLength": 1 }
+      }
+    },
+    "fixturePaths": {
+      "type": "object",
+      "additionalProperties": false,
+      "properties": {
+        "fixtureDir": { "type": "string" },
+        "sourceContractPath": { "type": "string" },
+        "sourceAstPath": { "type": "string" },
+        "bundleRoot": { "type": "string" },
+        "compiledContractPath": { "type": "string" },
+        "effectiveAstPath": { "type": "string" },
+        "preparedInputPath": { "type": "string" },
+        "acceptedSuggestionsPath": { "type": "string" },
+        "designerNotesPath": { "type": "string" },
+        "baselineValidatePath": { "type": "string" }
+      }
+    },
+    "sessionRef": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": [
+        "guidanceStrategy",
+        "sessionId",
+        "sessionDir",
+        "transcriptPath",
+        "guidanceHandoffPath",
+        "agentInputPath",
+        "explainabilityPath",
+        "summaryPath",
+        "previewPath"
+      ],
+      "properties": {
+        "guidanceStrategy": {
+          "type": "string",
+          "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
+        },
+        "sessionId": { "type": "string", "minLength": 1 },
+        "sessionDir": { "type": "string", "minLength": 1 },
+        "transcriptPath": { "type": "string", "minLength": 1 },
+        "guidanceHandoffPath": { "type": "string", "minLength": 1 },
+        "agentInputPath": { "type": "string", "minLength": 1 },
+        "explainabilityPath": { "type": "string", "minLength": 1 },
+        "summaryPath": { "type": "string", "minLength": 1 },
+        "previewPath": { "type": ["string", "null"] }
+      }
+    },
+    "comparisonRef": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["baselineGuidanceStrategy", "guidedGuidanceStrategy", "comparisonDir", "comparisonPath"],
+      "properties": {
+        "baselineGuidanceStrategy": {
+          "type": "string",
+          "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
+        },
+        "guidedGuidanceStrategy": {
+          "type": "string",
+          "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
+        },
+        "comparisonDir": { "type": "string", "minLength": 1 },
+        "comparisonPath": { "type": "string", "minLength": 1 }
+      }
+    },
+    "fixture": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": [
+        "fixtureId",
+        "surfaceId",
+        "brief",
+        "platformTarget",
+        "consumerType",
+        "capturePreset",
+        "comparisonPairs",
+        "sessions",
+        "comparisons"
+      ],
+      "properties": {
+        "fixtureId": { "type": "string", "minLength": 1 },
+        "surfaceId": { "type": "string", "minLength": 1 },
+        "brief": { "$ref": "#/$defs/brief" },
+        "platformTarget": {
+          "type": "string",
+          "enum": ["web", "ios", "android"]
+        },
+        "consumerType": {
+          "type": "string",
+          "enum": ["web-browser", "desktop-shell", "ios-native", "android-native"]
+        },
+        "capturePreset": { "type": "string", "minLength": 1 },
+        "comparisonPairs": {
+          "type": "array",
+          "items": { "$ref": "#/$defs/comparisonPair" }
+        },
+        "paths": {
+          "$ref": "#/$defs/fixturePaths"
+        },
+        "sessions": {
+          "type": "array",
+          "items": { "$ref": "#/$defs/sessionRef" }
+        },
+        "comparisons": {
+          "type": "array",
+          "items": { "$ref": "#/$defs/comparisonRef" }
+        }
+      }
+    }
+  }
+}
diff --git a/packages/interfacectl-cli/schemas/generation-benchmark-spec.schema.json b/packages/interfacectl-cli/schemas/generation-benchmark-spec.schema.json
new file mode 100644
index 0000000..89b0227
--- /dev/null
+++ b/packages/interfacectl-cli/schemas/generation-benchmark-spec.schema.json
@@ -0,0 +1,159 @@
+{
+  "$schema": "https://json-schema.org/draft/2020-12/schema",
+  "$id": "https://surfaces.dev/schemas/generation-benchmark-spec.schema.json",
+  "title": "GenerationBenchmarkSpec",
+  "type": "object",
+  "additionalProperties": false,
+  "required": [
+    "schemaVersion",
+    "specId",
+    "generatedAt",
+    "evaluationMode",
+    "attemptBudget",
+    "guidanceStrategies",
+    "comparisonPairs",
+    "fixtures"
+  ],
+  "properties": {
+    "schemaVersion": {
+      "type": "number",
+      "const": 1
+    },
+    "specId": {
+      "type": "string",
+      "minLength": 1
+    },
+    "generatedAt": {
+      "type": "string",
+      "format": "date-time"
+    },
+    "evaluationMode": {
+      "type": "string",
+      "enum": ["zero-shot", "iterative"]
+    },
+    "attemptBudget": {
+      "type": "integer",
+      "minimum": 1
+    },
+    "guidanceStrategies": {
+      "type": "array",
+      "items": {
+        "type": "string",
+        "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
+      }
+    },
+    "comparisonPairs": {
+      "type": "array",
+      "items": {
+        "$ref": "#/$defs/comparisonPair"
+      }
+    },
+    "suiteId": {
+      "type": "string"
+    },
+    "suiteName": {
+      "type": "string"
+    },
+    "fixtures": {
+      "type": "array",
+      "items": {
+        "$ref": "#/$defs/fixture"
+      }
+    }
+  },
+  "$defs": {
+    "comparisonPair": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["baselineGuidanceStrategy", "guidedGuidanceStrategy"],
+      "properties": {
+        "baselineGuidanceStrategy": {
+          "type": "string",
+          "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
+        },
+        "guidedGuidanceStrategy": {
+          "type": "string",
+          "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
+        }
+      }
+    },
+    "brief": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["path", "sha256"],
+      "properties": {
+        "path": {
+          "type": "string",
+          "minLength": 1
+        },
+        "sha256": {
+          "type": "string",
+          "minLength": 1
+        }
+      }
+    },
+    "fixturePaths": {
+      "type": "object",
+      "additionalProperties": false,
+      "properties": {
+        "fixtureDir": { "type": "string" },
+        "sourceContractPath": { "type": "string" },
+        "sourceAstPath": { "type": "string" },
+        "bundleRoot": { "type": "string" },
+        "compiledContractPath": { "type": "string" },
+        "effectiveAstPath": { "type": "string" },
+        "preparedInputPath": { "type": "string" },
+        "acceptedSuggestionsPath": { "type": "string" },
+        "designerNotesPath": { "type": "string" },
+        "baselineValidatePath": { "type": "string" }
+      }
+    },
+    "fixture": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": [
+        "fixtureId",
+        "surfaceId",
+        "brief",
+        "platformTarget",
+        "consumerType",
+        "capturePreset",
+        "comparisonPairs"
+      ],
+      "properties": {
+        "fixtureId": {
+          "type": "string",
+          "minLength": 1
+        },
+        "surfaceId": {
+          "type": "string",
+          "minLength": 1
+        },
+        "brief": {
+          "$ref": "#/$defs/brief"
+        },
+        "platformTarget": {
+          "type": "string",
+          "enum": ["web", "ios", "android"]
+        },
+        "consumerType": {
+          "type": "string",
+          "enum": ["web-browser", "desktop-shell", "ios-native", "android-native"]
+        },
+        "capturePreset": {
+          "type": "string",
+          "minLength": 1
+        },
+        "comparisonPairs": {
+          "type": "array",
+          "items": {
+            "$ref": "#/$defs/comparisonPair"
+          }
+        },
+        "paths": {
+          "$ref": "#/$defs/fixturePaths"
+        }
+      }
+    }
+  }
+}
diff --git a/packages/interfacectl-cli/schemas/generation-guidance-handoff.schema.json b/packages/interfacectl-cli/schemas/generation-guidance-handoff.schema.json
index 38f447c..0a49919 100644
--- a/packages/interfacectl-cli/schemas/generation-guidance-handoff.schema.json
+++ b/packages/interfacectl-cli/schemas/generation-guidance-handoff.schema.json
@@ -15,6 +15,7 @@
     "session",
     "runtimeGuidance",
     "promptSummary",
+    "baselinePrimary",
     "jsonPrimary"
   ],
   "properties": {
@@ -36,7 +37,7 @@
     },
     "guidanceStrategy": {
       "type": "string",
-      "enum": ["prompt-summary", "json-primary", "unguided"]
+      "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
     },
     "generatedAt": {
       "type": "string",
@@ -168,6 +169,26 @@
         }
       ]
     },
+    "baselinePrimary": {
+      "oneOf": [
+        {
+          "type": "null"
+        },
+        {
+          "type": "object",
+          "additionalProperties": false,
+          "required": ["effectiveContractSummary", "baselineContractSummary"],
+          "properties": {
+            "effectiveContractSummary": {
+              "type": "string"
+            },
+            "baselineContractSummary": {
+              "type": "string"
+            }
+          }
+        }
+      ]
+    },
     "jsonPrimary": {
       "oneOf": [
         {
diff --git a/packages/interfacectl-cli/schemas/generation-session-comparison.schema.json b/packages/interfacectl-cli/schemas/generation-session-comparison.schema.json
index a5f807c..22ce358 100644
--- a/packages/interfacectl-cli/schemas/generation-session-comparison.schema.json
+++ b/packages/interfacectl-cli/schemas/generation-session-comparison.schema.json
@@ -94,7 +94,7 @@
         "rubric": {
           "type": "object",
           "additionalProperties": false,
-          "required": ["structure", "components", "boundary", "visual", "responsiveness"],
+          "required": ["structure", "components", "boundary", "visual", "responsiveness", "platformFit"],
           "properties": {
             "structure": {
               "$ref": "#/$defs/rubricDelta"
@@ -110,6 +110,9 @@
             },
             "responsiveness": {
               "$ref": "#/$defs/rubricDelta"
+            },
+            "platformFit": {
+              "$ref": "#/$defs/rubricDelta"
             }
           }
         }
@@ -136,7 +139,7 @@
           "type": "array",
           "items": {
             "type": "string",
-            "enum": ["structure", "components", "boundary", "visual", "responsiveness"]
+            "enum": ["structure", "components", "boundary", "visual", "responsiveness", "platformFit"]
           }
         },
         "meetsGoal": {
@@ -253,7 +256,7 @@
     "assessment": {
       "type": "object",
       "additionalProperties": false,
-      "required": ["structure", "components", "boundary", "visual", "responsiveness", "notes"],
+      "required": ["structure", "components", "boundary", "visual", "responsiveness", "platformFit", "notes"],
       "properties": {
         "structure": {
           "type": "string",
@@ -275,6 +278,10 @@
           "type": "string",
           "enum": ["strong", "partial", "weak"]
         },
+        "platformFit": {
+          "type": "string",
+          "enum": ["strong", "partial", "weak"]
+        },
         "notes": {
           "type": "string",
           "minLength": 1
@@ -350,7 +357,7 @@
         },
         "guidanceStrategy": {
           "type": "string",
-          "enum": ["prompt-summary", "json-primary", "unguided"]
+          "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
         },
         "attemptCount": {
           "type": "number",
diff --git a/packages/interfacectl-cli/schemas/generation-session-summary.schema.json b/packages/interfacectl-cli/schemas/generation-session-summary.schema.json
index ea99d19..a975f7d 100644
--- a/packages/interfacectl-cli/schemas/generation-session-summary.schema.json
+++ b/packages/interfacectl-cli/schemas/generation-session-summary.schema.json
@@ -43,7 +43,7 @@
     },
     "guidanceStrategy": {
       "type": "string",
-      "enum": ["prompt-summary", "json-primary", "unguided"]
+      "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
     },
     "attemptCount": {
       "type": "number",
@@ -249,7 +249,7 @@
     "assessment": {
       "type": "object",
       "additionalProperties": false,
-      "required": ["structure", "components", "boundary", "visual", "responsiveness", "notes"],
+      "required": ["structure", "components", "boundary", "visual", "responsiveness", "platformFit", "notes"],
       "properties": {
         "structure": {
           "type": "string",
@@ -271,6 +271,10 @@
           "type": "string",
           "enum": ["strong", "partial", "weak"]
         },
+        "platformFit": {
+          "type": "string",
+          "enum": ["strong", "partial", "weak"]
+        },
         "notes": {
           "type": "string",
           "minLength": 1
diff --git a/packages/interfacectl-cli/schemas/generation-session.schema.json b/packages/interfacectl-cli/schemas/generation-session.schema.json
index b73d7e9..cb6636d 100644
--- a/packages/interfacectl-cli/schemas/generation-session.schema.json
+++ b/packages/interfacectl-cli/schemas/generation-session.schema.json
@@ -40,7 +40,7 @@
     },
     "guidanceStrategy": {
       "type": "string",
-      "enum": ["prompt-summary", "json-primary", "unguided"]
+      "enum": ["prompt-summary", "baseline-primary", "json-primary", "unguided"]
     },
     "workspaceRoot": {
       "type": "string",
diff --git a/packages/interfacectl-cli/src/commands/generation-session.ts b/packages/interfacectl-cli/src/commands/generation-session.ts
index cda3ff3..5844444 100644
--- a/packages/interfacectl-cli/src/commands/generation-session.ts
+++ b/packages/interfacectl-cli/src/commands/generation-session.ts
@@ -20,13 +20,22 @@ import { stringifyDeterministicJson, writeDeterministicJsonSync } from "../utils
 type SessionTool = "codex" | "cursor" | "local-llm";
 type AssessmentGrade = "strong" | "partial" | "weak";
 type ValidateStatus = "pass" | "warn" | "block";
-type GuidanceStrategy = "prompt-summary" | "json-primary" | "unguided";
+type GuidanceStrategy = "prompt-summary" | "baseline-primary" | "json-primary" | "unguided";
 type SessionSuccessRule = "pass" | "pass-or-reviewed-warn";
 type AttemptReviewStatus = "accepted" | "rejected";
 type AttemptOutcome = ValidateStatus | "accepted-warn";
 type SuggestionStatus = "proposed" | "accepted" | "rejected";
-
-type AssessmentDimension = "structure" | "components" | "boundary" | "visual" | "responsiveness";
+type EvaluationMode = "zero-shot" | "iterative"; // same members as VALID_EVALUATION_MODES; ensureEvaluationMode falls back to "zero-shot" for non-string input
+type PlatformTarget = "web" | "ios" | "android"; // same members as VALID_PLATFORM_TARGETS, checked by ensurePlatformTarget
+type ConsumerType = "web-browser" | "desktop-shell" | "ios-native" | "android-native"; // same members as VALID_CONSUMER_TYPES, checked by ensureConsumerType
+
+type AssessmentDimension =
+  | "structure"
+  | "components"
+  | "boundary"
+  | "visual"
+  | "responsiveness"
+  | "platformFit";
 
 export interface InitGenerationSessionCommandOptions {
   bundleRoot?: string;
@@ -93,6 +102,19 @@ export interface SummarizeGenerationBenchmarkCommandOptions {
   comparisonPaths?: string;
   suggestionPaths?: string;
   outDir?: string;
+  runPath?: string;
+}
+
+export interface ReplayGenerationBenchmarkCommandOptions { // options bag taken by runReplayGenerationBenchmarkCommand; every field is an optional string
+  specPath?: string;
+  tool?: string;
+  outDir?: string;
+  cohortId?: string;
+  sourceRunPath?: string;
+  requestedModelLabel?: string; // this and the next three share names with GenerationBenchmarkRun.model — presumably its source; confirm against the command body
+  resolvedModelId?: string;
+  baseUrl?: string;
+  fingerprint?: string;
 }
 
 interface GenerationAssessment {
@@ -101,6 +123,7 @@ interface GenerationAssessment {
   boundary: AssessmentGrade;
   visual: AssessmentGrade;
   responsiveness: AssessmentGrade;
+  platformFit: AssessmentGrade;
   notes: string;
   touchedFiles?: string[];
   heuristics?: GenerationAssessmentHeuristics;
@@ -368,8 +391,23 @@ interface ContractDeltaSuggestionsArtifact {
 }
 
 interface GenerationBenchmarkReport {
-  schemaVersion: 2;
+  schemaVersion: 3;
   generatedAt: string;
+  run?: {
+    cohortId: string;
+    evaluationMode: EvaluationMode;
+    tool: SessionTool;
+    sourceSpecPath: string;
+    sourceRunPath: string | null;
+    guidanceStrategies: GuidanceStrategy[];
+    attemptBudget: number;
+    model: {
+      requestedModelLabel: string | null;
+      resolvedModelId: string | null;
+      baseUrl: string | null;
+      fingerprint: string | null;
+    };
+  };
   comparisons: Array<{
     surfaceId: string;
     tool: SessionTool;
@@ -377,6 +415,9 @@ interface GenerationBenchmarkReport {
     meetsGoal: boolean;
     baselineGuidanceStrategy: GuidanceStrategy;
     guidedGuidanceStrategy: GuidanceStrategy;
+    platformTarget?: PlatformTarget;
+    consumerType?: ConsumerType;
+    modelLabel?: string | null;
     guidedFewerFirstAttemptBlockingFindings: boolean;
     guidedReachedAcceptableNoLater: boolean;
     guidedRubricBetterDimensions: AssessmentDimension[];
@@ -400,6 +441,19 @@ interface GenerationBenchmarkReport {
     proposedSuggestionCount: number;
     heuristics: GenerationBenchmarkHeuristicsSummary;
   };
+  breakdowns?: {
+    byPlatformTarget: Record<string, GenerationBenchmarkBreakdownSummary>;
+    byConsumerType: Record<string, GenerationBenchmarkBreakdownSummary>;
+    byModelLabel: Record<string, GenerationBenchmarkBreakdownSummary>;
+  };
+}
+
+interface GenerationBenchmarkBreakdownSummary { // value type of each bucket in GenerationBenchmarkReport.breakdowns (byPlatformTarget, byConsumerType, byModelLabel)
+  comparisonCount: number; // rendered as "comparisons=" in the markdown report
+  surfaceCount: number; // rendered as "surfaces="
+  surfacesMeetingGoal: number; // rendered as "meetsGoal="
+  guidedFewerFirstAttemptBlockingFindings: number; // rendered as "fewerBlocking="
+  guidedReachedAcceptableNoLater: number; // rendered as "acceptableNoLater="
 }
 
 interface GenerationAssessmentHeuristics {
@@ -480,6 +534,10 @@ interface GenerationGuidanceHandoff {
     effectiveContractSummary: string;
     preparedGuidanceSummary: string;
   } | null;
+  baselinePrimary: {
+    effectiveContractSummary: string;
+    baselineContractSummary: string;
+  } | null;
   jsonPrimary: {
     surface: Record<string, unknown>;
     contract: Record<string, unknown>;
@@ -507,18 +565,115 @@ interface LoadedAttempt {
   previewMetadataPath?: string;
 }
 
+interface GenerationBenchmarkSpecFixture { // one entry of GenerationBenchmarkSpec.fixtures; field names match the "fixture" definition in generation-benchmark-spec.schema.json
+  fixtureId: string;
+  surfaceId: string;
+  brief: GenerationBrief; // the report renderer reads brief.path and brief.sha256
+  platformTarget: PlatformTarget;
+  consumerType: ConsumerType;
+  capturePreset: string;
+  comparisonPairs: Array<{
+    baselineGuidanceStrategy: GuidanceStrategy;
+    guidedGuidanceStrategy: GuidanceStrategy;
+  }>;
+  paths?: { // all optional; the report renderer lists only the entries that are set
+    fixtureDir?: string;
+    sourceContractPath?: string;
+    sourceAstPath?: string;
+    bundleRoot?: string;
+    compiledContractPath?: string;
+    effectiveAstPath?: string;
+    preparedInputPath?: string;
+    acceptedSuggestionsPath?: string;
+    designerNotesPath?: string;
+    baselineValidatePath?: string;
+  };
+}
+
+interface GenerationBenchmarkSpec { // return type of loadGenerationBenchmarkSpec; field names match generation-benchmark-spec.schema.json
+  schemaVersion: 1;
+  specId: string;
+  generatedAt: string;
+  evaluationMode: EvaluationMode;
+  attemptBudget: number; // the loader tests this with Number.isInteger and >= 1
+  guidanceStrategies: GuidanceStrategy[]; // the loader rejects fewer than two entries
+  comparisonPairs: Array<{ // normalizeBenchmarkComparisonPairs requires a non-empty array
+    baselineGuidanceStrategy: GuidanceStrategy;
+    guidedGuidanceStrategy: GuidanceStrategy;
+  }>;
+  suiteId?: string;
+  suiteName?: string;
+  fixtures: GenerationBenchmarkSpecFixture[]; // the loader rejects an empty array
+}
+
+interface GenerationBenchmarkRunFixture extends GenerationBenchmarkSpecFixture { // element type of GenerationBenchmarkRun.fixtures: a spec fixture plus session and comparison references
+  sessions: Array<{
+    guidanceStrategy: GuidanceStrategy;
+    sessionId: string;
+    sessionDir: string;
+    transcriptPath: string;
+    guidanceHandoffPath: string;
+    agentInputPath: string; // the report renderer inlines this file's trimmed text when it exists
+    explainabilityPath: string;
+    summaryPath: string; // parsed as JSON by the report renderer when the file exists
+    previewPath: string | null; // null is rendered as "not captured"
+  }>;
+  comparisons: Array<{
+    baselineGuidanceStrategy: GuidanceStrategy;
+    guidedGuidanceStrategy: GuidanceStrategy;
+    comparisonDir: string;
+    comparisonPath: string; // listed per pair under "Fixture Comparisons" in the report
+  }>;
+}
+
+interface GenerationBenchmarkRun { // type of the optional `run` argument of renderBenchmarkReportMarkdown; several fields repeat GenerationBenchmarkReport.run
+  schemaVersion: 1;
+  cohortId: string;
+  generatedAt: string;
+  evaluationMode: EvaluationMode;
+  tool: SessionTool;
+  sourceSpecPath: string;
+  sourceRunPath: string | null;
+  attemptBudget: number;
+  guidanceStrategies: GuidanceStrategy[];
+  comparisonPairs: Array<{
+    baselineGuidanceStrategy: GuidanceStrategy;
+    guidedGuidanceStrategy: GuidanceStrategy;
+  }>;
+  model: { // same four nullable fields as GenerationBenchmarkReport.run.model
+    requestedModelLabel: string | null;
+    resolvedModelId: string | null;
+    baseUrl: string | null;
+    fingerprint: string | null;
+  };
+  suiteId?: string;
+  suiteName?: string;
+  paths: {
+    benchmarkDir: string;
+    specPath: string;
+    runPath: string;
+    reportJsonPath: string | null;
+    reportMarkdownPath: string | null;
+  };
+  fixtures: GenerationBenchmarkRunFixture[]; // the report renderer emits one evidence section per entry
+}
+
 const VALID_TOOLS = new Set<SessionTool>(["codex", "cursor", "local-llm"]);
 const VALID_GRADES = new Set<AssessmentGrade>(["strong", "partial", "weak"]);
-const VALID_GUIDANCE_STRATEGIES = new Set<GuidanceStrategy>(["prompt-summary", "json-primary", "unguided"]);
+const VALID_GUIDANCE_STRATEGIES = new Set<GuidanceStrategy>(["prompt-summary", "baseline-primary", "json-primary", "unguided"]);
 const VALID_REVIEW_STATUSES = new Set<AttemptReviewStatus>(["accepted", "rejected"]);
 const VALID_SUGGESTION_STATUSES = new Set<SuggestionStatus>(["proposed", "accepted", "rejected"]);
 const VALID_SUCCESS_RULES = new Set<SessionSuccessRule>(["pass", "pass-or-reviewed-warn"]);
+const VALID_EVALUATION_MODES = new Set<EvaluationMode>(["zero-shot", "iterative"]);
+const VALID_PLATFORM_TARGETS = new Set<PlatformTarget>(["web", "ios", "android"]);
+const VALID_CONSUMER_TYPES = new Set<ConsumerType>(["web-browser", "desktop-shell", "ios-native", "android-native"]);
 const ASSESSMENT_DIMENSIONS: AssessmentDimension[] = [
   "structure",
   "components",
   "boundary",
   "visual",
   "responsiveness",
+  "platformFit",
 ];
 
 class SessionInputError extends Error {
@@ -595,12 +750,38 @@ function ensureGuidanceStrategy(guidanceStrategy?: string): GuidanceStrategy {
   const mapped = normalized === "prepared" ? "prompt-summary" : normalized;
   if (!VALID_GUIDANCE_STRATEGIES.has(mapped as GuidanceStrategy)) {
     throw new SessionInputError(
-      `Invalid guidance strategy "${guidanceStrategy ?? ""}". Expected prompt-summary|json-primary|unguided.`,
+      `Invalid guidance strategy "${guidanceStrategy ?? ""}". Expected prompt-summary|baseline-primary|json-primary|unguided.`,
     );
   }
   return mapped as GuidanceStrategy;
 }
 
+function ensureEvaluationMode(value?: string): EvaluationMode {
+  // Non-string input falls back to "zero-shot"; strings are trimmed and lower-cased before lookup.
+  const candidate = (typeof value === "string" ? value.trim().toLowerCase() : "zero-shot") as EvaluationMode;
+  if (VALID_EVALUATION_MODES.has(candidate)) return candidate;
+  // The message echoes the caller's raw value, not the normalized one.
+  throw new SessionInputError(`Invalid evaluation mode "${value ?? ""}". Expected zero-shot|iterative.`);
+}
+
+function ensurePlatformTarget(value: unknown, label: string): PlatformTarget {
+  // Non-string input is treated as "" and so rejected; `label` names the offending field in the error.
+  const candidate = (typeof value === "string" ? value.trim().toLowerCase() : "") as PlatformTarget;
+  if (VALID_PLATFORM_TARGETS.has(candidate)) return candidate;
+  // The message echoes the raw value (null/undefined shown as an empty string).
+  throw new SessionInputError(`Invalid ${label} "${String(value ?? "")}". Expected web|ios|android.`);
+}
+
+function ensureConsumerType(value: unknown, label: string): ConsumerType {
+  // Non-string input is treated as "" and so rejected; strings are trimmed and lower-cased
+  // before the VALID_CONSUMER_TYPES lookup. `label` names the offending field in the error.
+  const candidate = (typeof value === "string" ? value.trim().toLowerCase() : "") as ConsumerType;
+  if (VALID_CONSUMER_TYPES.has(candidate)) return candidate;
+  throw new SessionInputError(
+    `Invalid ${label} "${String(value ?? "")}". Expected web-browser|desktop-shell|ios-native|android-native.`,
+  );
+}
+
 function buildDefaultSessionId(): string {
   return new Date().toISOString().replace(/[-:]/g, "").replace(/\.\d{3}Z$/, "Z");
 }
@@ -647,7 +828,11 @@ function normalizeAssessment(
   const structureFallback = payload.structure;
   const grade = (key: AssessmentDimension) => {
     let value = payload[key];
-    if (value === undefined && options.allowLegacyMissing && (key === "components" || key === "boundary")) {
+    if (
+      value === undefined
+      && options.allowLegacyMissing
+      && (key === "components" || key === "boundary" || key === "platformFit")
+    ) {
       value = structureFallback;
     }
     if (!VALID_GRADES.has(value as AssessmentGrade)) {
@@ -711,6 +896,7 @@ function normalizeAssessment(
     boundary: grade("boundary"),
     visual: grade("visual"),
     responsiveness: grade("responsiveness"),
+    platformFit: grade("platformFit"),
     notes,
     ...(touchedFiles && touchedFiles.length > 0 ? { touchedFiles } : {}),
     ...(heuristics ? { heuristics } : {}),
@@ -1059,6 +1245,28 @@ function averageNullable(values: Array<number | null | undefined>): number | nul
   return Math.round((filtered.reduce((sum, value) => sum + value, 0) / filtered.length) * 1000) / 1000;
 }
 
+function readOptionalTrimmedText(filePath: string | null | undefined): string | null { // null when no path is given or nothing exists at it
+  if (filePath && fs.existsSync(filePath)) {
+    return fs.readFileSync(filePath, "utf8").trim(); // UTF-8 text with surrounding whitespace removed
+  }
+  return null;
+}
+
+/**
+ * Appends a blank line, `title`, and one `- label: path` bullet per artifact to `lines` (mutated in place).
+ * Entries whose path is missing or empty are dropped; if none remain, nothing is appended at all.
+ */
+function appendArtifactLines(
+  lines: string[],
+  title: string,
+  artifacts: Array<[label: string, filePath: string | undefined]>,
+) {
+  const present = artifacts.filter((artifact) => Boolean(artifact[1]));
+  if (present.length > 0) {
+    lines.push("", title, ...present.map(([label, filePath]) => `- ${label}: ${filePath}`));
+  }
+}
+
 function renderSummaryMarkdown(summary: GenerationSessionSummary): string {
   const lines = [
     "# Generation Session Summary",
@@ -1099,6 +1307,7 @@ function renderSummaryMarkdown(summary: GenerationSessionSummary): string {
   lines.push(`- boundary: ${summary.latestAssessment?.boundary ?? "n/a"}`);
   lines.push(`- visual: ${summary.latestAssessment?.visual ?? "n/a"}`);
   lines.push(`- responsiveness: ${summary.latestAssessment?.responsiveness ?? "n/a"}`);
+  lines.push(`- platform fit: ${summary.latestAssessment?.platformFit ?? "n/a"}`);
   lines.push(`- notes: ${summary.latestAssessment?.notes ?? "n/a"}`);
 
   if (summary.latestAssessment?.touchedFiles?.length) {
@@ -1435,11 +1644,24 @@ function renderSuggestionsMarkdown(artifact: ContractDeltaSuggestionsArtifact):
   return `${lines.join("\n")}\n`;
 }
 
-function renderBenchmarkReportMarkdown(report: GenerationBenchmarkReport): string {
+function renderBenchmarkReportMarkdown(report: GenerationBenchmarkReport, run?: GenerationBenchmarkRun | null): string {
   const lines = [
     "# Generation Benchmark Report",
     "",
     `Generated at: ${report.generatedAt}`,
+    ...(report.run
+      ? [
+          `Cohort: ${report.run.cohortId}`,
+          `Evaluation mode: ${report.run.evaluationMode}`,
+          `Tool: ${report.run.tool}`,
+          `Model label: ${report.run.model.requestedModelLabel ?? "not recorded"}`,
+          `Resolved model id: ${report.run.model.resolvedModelId ?? "not recorded"}`,
+          `Base URL: ${report.run.model.baseUrl ?? "not recorded"}`,
+          `Fingerprint: ${report.run.model.fingerprint ?? "not recorded"}`,
+          `Source spec: ${report.run.sourceSpecPath}`,
+          `Source run: ${report.run.sourceRunPath ?? "none"}`,
+        ]
+      : []),
     `Surfaces: ${report.overall.surfaceCount}`,
     `Surfaces meeting goal: ${report.overall.surfacesMeetingGoal}`,
     `Candidate fewer first-attempt blocking findings: ${report.overall.guidedFewerFirstAttemptBlockingFindings}`,
@@ -1448,10 +1670,14 @@ function renderBenchmarkReportMarkdown(report: GenerationBenchmarkReport): strin
     "## Comparisons",
   ];
 
-  for (const comparison of report.comparisons) {
-    lines.push(
-      `- ${comparison.surfaceId}: baseline=${comparison.baselineGuidanceStrategy}, candidate=${comparison.guidedGuidanceStrategy}, meetsGoal=${comparison.meetsGoal}, improved dimensions=${comparison.guidedRubricBetterDimensions.join(", ") || "none"}`,
-    );
+  if (report.comparisons.length === 0) {
+    lines.push("- none");
+  } else {
+    for (const comparison of report.comparisons) {
+      lines.push(
+        `- ${comparison.surfaceId}: baseline=${comparison.baselineGuidanceStrategy}, candidate=${comparison.guidedGuidanceStrategy}, platform=${comparison.platformTarget ?? "unknown"}, consumer=${comparison.consumerType ?? "unknown"}, model=${comparison.modelLabel ?? "unknown"}, meetsGoal=${comparison.meetsGoal}, improved dimensions=${comparison.guidedRubricBetterDimensions.join(", ") || "none"}`,
+      );
+    }
   }
 
   lines.push("", "## Suggestion decisions");
@@ -1469,6 +1695,97 @@ function renderBenchmarkReportMarkdown(report: GenerationBenchmarkReport): strin
   lines.push(`- lower repeated finding carryover count: ${report.overall.heuristics.lowerRepeatedFindingCarryoverCount}`);
   lines.push(`- lower reruns to acceptable outcome: ${report.overall.heuristics.lowerRerunsToAcceptableOutcome}`);
 
+  if (report.breakdowns) {
+    const renderBreakdownBlock = (title: string, entries: Record<string, GenerationBenchmarkBreakdownSummary>) => {
+      lines.push("", title);
+      const keys = Object.keys(entries).sort((left, right) => left.localeCompare(right));
+      if (keys.length === 0) {
+        lines.push("- none");
+        return;
+      }
+      for (const key of keys) {
+        const entry = entries[key];
+        lines.push(
+          `- ${key}: comparisons=${entry.comparisonCount}, surfaces=${entry.surfaceCount}, meetsGoal=${entry.surfacesMeetingGoal}, fewerBlocking=${entry.guidedFewerFirstAttemptBlockingFindings}, acceptableNoLater=${entry.guidedReachedAcceptableNoLater}`,
+        );
+      }
+    };
+    renderBreakdownBlock("## By Platform Target", report.breakdowns.byPlatformTarget);
+    renderBreakdownBlock("## By Consumer Type", report.breakdowns.byConsumerType);
+    renderBreakdownBlock("## By Model", report.breakdowns.byModelLabel);
+  }
+
+  if (run) {
+    lines.push("", "## Zero-Shot Evidence");
+    for (const fixture of run.fixtures) {
+      lines.push(
+        "",
+        `### ${fixture.surfaceId}`,
+        `- fixture: ${fixture.fixtureId}`,
+        `- platform target: ${fixture.platformTarget}`,
+        `- consumer type: ${fixture.consumerType}`,
+        `- capture preset: ${fixture.capturePreset}`,
+        `- brief path: ${fixture.brief.path}`,
+        `- brief sha256: ${fixture.brief.sha256}`,
+      );
+
+      const briefText = readOptionalTrimmedText(fixture.brief.path);
+      if (briefText) {
+        lines.push("", "#### Benchmark Brief", "", "```md", briefText, "```");
+      }
+
+      appendArtifactLines(lines, "#### Contract Artifacts", [
+        ["source contract", fixture.paths?.sourceContractPath],
+        ["source AST", fixture.paths?.sourceAstPath],
+        ["bundle root", fixture.paths?.bundleRoot],
+        ["compiled contract", fixture.paths?.compiledContractPath],
+        ["effective AST", fixture.paths?.effectiveAstPath],
+      ]);
+
+      appendArtifactLines(lines, "#### Prompt And Input Artifacts", [
+        ["prepared input", fixture.paths?.preparedInputPath],
+        ["accepted suggestions", fixture.paths?.acceptedSuggestionsPath],
+        ["designer notes", fixture.paths?.designerNotesPath],
+        ["baseline validate", fixture.paths?.baselineValidatePath],
+      ]);
+
+      if (fixture.comparisons.length > 0) {
+        lines.push("", "#### Fixture Comparisons");
+        for (const comparison of fixture.comparisons) {
+          lines.push(
+            `- ${comparison.baselineGuidanceStrategy} vs ${comparison.guidedGuidanceStrategy}: ${comparison.comparisonPath}`,
+          );
+        }
+      }
+
+      if (fixture.sessions.length > 0) {
+        lines.push("", "#### Session Evidence");
+        for (const session of fixture.sessions) {
+          const summary = fs.existsSync(session.summaryPath)
+            ? readJsonFile<JsonRecord>(session.summaryPath, "generation benchmark session summary")
+            : null;
+          lines.push(
+            "",
+            `##### ${session.guidanceStrategy}`,
+            `- session id: ${session.sessionId}`,
+            `- session dir: ${session.sessionDir}`,
+            `- latest status: ${asString(summary?.latestStatus) ?? "not recorded"}`,
+            `- latest outcome: ${asString(summary?.latestOutcome) ?? "not recorded"}`,
+            `- error: ${asString(summary?.errorMessage) ?? "none"}`,
+            `- summary path: ${session.summaryPath}`,
+            `- guidance handoff: ${session.guidanceHandoffPath}`,
+            `- agent input: ${session.agentInputPath}`,
+            `- preview: ${session.previewPath ?? "not captured"}`,
+          );
+          const agentInput = readOptionalTrimmedText(session.agentInputPath);
+          if (agentInput) {
+            lines.push("", "```txt", agentInput, "```");
+          }
+        }
+      }
+    }
+  }
+
   return `${lines.join("\n")}\n`;
 }
 
@@ -1578,6 +1895,39 @@ function buildPreparedPromptSummary(preparedPayload: ReturnType<typeof buildPrep
   ].join("\n");
 }
 
+/** Plain-text contract digest used as the baseline-primary handoff summary: one "Label: value" line per field, with a placeholder wherever a value is absent. */
+function buildBaselinePrimarySummary(preparedPayload: ReturnType<typeof buildPreparedGenerationPayload>): string {
+  const surface = asRecord(preparedPayload.surface);
+  const contract = asRecord(preparedPayload.contract);
+  const constraints = asRecord(preparedPayload.constraints);
+  const generation = asRecord(preparedPayload.generation);
+  const layout = asRecord(generation.layout);
+  const guidance = asRecord(generation.guidance);
+  const boundaryRules = Array.isArray(guidance.boundaryRules)
+    ? guidance.boundaryRules.filter((entry): entry is JsonRecord => isRecord(entry))
+    : [];
+  const sections = Array.isArray(preparedPayload.sections)
+    ? preparedPayload.sections.filter((entry): entry is JsonRecord => isRecord(entry))
+    : [];
+  const repairMap = extractRepairEntries(preparedPayload.repairMap);
+  const color = asRecord(constraints.color);
+  const motion = asRecord(constraints.motion);
+  const motionDurations = Array.isArray(motion.allowedDurationsMs) // "" for a missing OR empty list, so both hit the placeholder below
+    ? motion.allowedDurationsMs.map((value) => `${String(value)}ms`).join(", ")
+    : "";
+
+  return [
+    `Surface: ${asString(surface.id) ?? "unknown"} (${asString(surface.type) ?? "unspecified"})`,
+    `Contract: ${asString(contract.id) ?? "unknown"} v${asString(contract.version) ?? "0.0.0"}`,
+    `Required sections: ${sections.map((entry) => asString(entry.id) ?? "").filter(Boolean).join(", ") || "none recorded"}`,
+    `Boundary rules: ${boundaryRules.map((entry) => asString(entry.id) ?? "").filter(Boolean).join(", ") || "none recorded"}`,
+    `Max content width: ${typeof layout.maxContentWidth === "number" ? `${layout.maxContentWidth}px` : "unspecified"}`,
+    `Allowed colors: ${asStringArray(color.allowedValues).join(", ") || "none recorded"}`,
+    `Motion durations: ${motionDurations || "none recorded"}`,
+    `Top repair codes: ${repairMap.slice(0, 5).map((entry) => asString(entry.code) ?? "").filter(Boolean).join(", ") || "none"}`,
+  ].join("\n");
+}
+
 function selectRelevantComponents(preparedPayload: ReturnType<typeof buildPreparedGenerationPayload>): Array<Record<string, unknown>> {
   const sections = Array.isArray(preparedPayload.sections)
     ? preparedPayload.sections.filter((entry): entry is JsonRecord => isRecord(entry))
@@ -1765,6 +2115,12 @@ function buildGuidanceHandoff(
           preparedGuidanceSummary: buildPreparedPromptSummary(preparedPayload!),
         }
       : null,
+    baselinePrimary: guidanceStrategy === "baseline-primary"
+      ? {
+          effectiveContractSummary: summarizeContractForSurface(session.contractPath, session.surfaceId),
+          baselineContractSummary: buildBaselinePrimarySummary(preparedPayload!),
+        }
+      : null,
     jsonPrimary: guidanceStrategy === "json-primary"
       ? {
           surface: asRecord(preparedPayload!.surface),
@@ -2162,6 +2518,223 @@ function normalizeSuggestionReviewFile(filePath: string): Array<{
   });
 }
 
+function buildDefaultBenchmarkCohortId(): string { // current UTC time compacted to 14 digits (YYYYMMDDHHmmss)
+  return new Date().toISOString().slice(0, 19).replace(/\D/g, "");
+}
+
+/** Validates `value` as a non-empty list of baseline/guided strategy pairs; `label` prefixes every error message. */
+function normalizeBenchmarkComparisonPairs(value: unknown, label: string): GenerationBenchmarkSpec["comparisonPairs"] {
+  if (!Array.isArray(value) || value.length === 0) {
+    throw new SessionInputError(`${label} must be a non-empty array.`);
+  }
+  return value.map((entry, index) => {
+    const pair = asRecord(entry);
+    // Reads one strategy field, failing with the indexed field path when asString yields null/undefined.
+    const readStrategy = (field: "baselineGuidanceStrategy" | "guidedGuidanceStrategy") => {
+      const raw = asString(pair[field]);
+      if (raw === null || raw === undefined) {
+        throw new SessionInputError(`${label}[${index}].${field} is required.`);
+      }
+      return ensureGuidanceStrategy(raw);
+    };
+    const baselineGuidanceStrategy = readStrategy("baselineGuidanceStrategy");
+    const guidedGuidanceStrategy = readStrategy("guidedGuidanceStrategy");
+    return { baselineGuidanceStrategy, guidedGuidanceStrategy };
+  });
+}
+
+/**
+ * Loads a generation benchmark spec JSON file and normalizes it into a GenerationBenchmarkSpec.
+ *
+ * Enforced here: a non-empty fixtures array, at least two guidance strategies, non-empty
+ * comparison pairs and a positive-integer attemptBudget. Optional string fields for which
+ * asString yields nothing (or an empty string) are left out of the result entirely.
+ * attemptBudget may be a JSON number or a numeric string; other JSON types are rejected.
+ *
+ * @param specPath Spec file location; passed through path.resolve before reading.
+ * @returns The normalized spec; schemaVersion is always emitted as 1.
+ * @throws SessionInputError when a required field is missing or malformed.
+ */
+function loadGenerationBenchmarkSpec(specPath: string): GenerationBenchmarkSpec {
+  type FixturePaths = NonNullable<GenerationBenchmarkSpec["fixtures"][number]["paths"]>;
+  // Optional per-fixture path keys, in the order they are written to the normalized spec.
+  const fixturePathKeys = [
+    "fixtureDir", "sourceContractPath", "sourceAstPath", "bundleRoot", "compiledContractPath",
+    "effectiveAstPath", "preparedInputPath", "acceptedSuggestionsPath", "designerNotesPath", "baselineValidatePath",
+  ] as const;
+
+  const resolvedPath = path.resolve(specPath);
+  const payload = readJsonFile<JsonRecord>(resolvedPath, "generation benchmark spec");
+  // Raises the shared "<field> is required" error; returning `never` lets it sit behind `??`.
+  const missing = (field: string): never => {
+    throw new SessionInputError(`${field} is required in ${resolvedPath}.`);
+  };
+
+  const fixturesValue = payload.fixtures;
+  if (!Array.isArray(fixturesValue) || fixturesValue.length === 0) {
+    throw new SessionInputError(`Benchmark spec must include a non-empty fixtures array: ${resolvedPath}.`);
+  }
+  const guidanceStrategies = asStringArray(payload.guidanceStrategies).map((entry) => ensureGuidanceStrategy(entry));
+  if (guidanceStrategies.length < 2) {
+    throw new SessionInputError(`Benchmark spec must freeze at least two guidance strategies: ${resolvedPath}.`);
+  }
+  const comparisonPairs = normalizeBenchmarkComparisonPairs(payload.comparisonPairs, "comparisonPairs");
+  // Only numbers and non-blank numeric strings are converted: a bare Number() would turn
+  // `true` or `[2]` into a "valid" budget instead of rejecting the malformed spec.
+  const rawBudget = payload.attemptBudget;
+  const budgetIsNumeric = typeof rawBudget === "number" || (typeof rawBudget === "string" && rawBudget.trim() !== "");
+  const attemptBudget = budgetIsNumeric ? Number(rawBudget) : Number.NaN;
+  if (!Number.isInteger(attemptBudget) || attemptBudget < 1) {
+    throw new SessionInputError(`Benchmark spec attemptBudget must be a positive integer: ${resolvedPath}.`);
+  }
+  const suiteId = asString(payload.suiteId);
+  const suiteName = asString(payload.suiteName);
+
+  return {
+    schemaVersion: 1,
+    specId: asString(payload.specId) ?? path.basename(resolvedPath, path.extname(resolvedPath)),
+    generatedAt: asString(payload.generatedAt) ?? new Date().toISOString(),
+    evaluationMode: ensureEvaluationMode(asString(payload.evaluationMode) ?? "zero-shot"),
+    attemptBudget,
+    guidanceStrategies,
+    comparisonPairs,
+    ...(suiteId ? { suiteId } : {}),
+    ...(suiteName ? { suiteName } : {}),
+    fixtures: fixturesValue.map((entry, index) => {
+      const record = asRecord(entry);
+      const brief = asRecord(record.brief);
+      const pathsRecord = record.paths !== undefined ? asRecord(record.paths) : null;
+      // Per-fixture pairs override the spec-level default whenever the key is present.
+      const fixtureComparisonPairs = record.comparisonPairs !== undefined
+        ? normalizeBenchmarkComparisonPairs(record.comparisonPairs, `fixtures[${index}].comparisonPairs`)
+        : comparisonPairs;
+      // `paths` is emitted only when the fixture declares it, keeping just the known keys that have a value.
+      const paths: FixturePaths = {};
+      if (pathsRecord) {
+        for (const key of fixturePathKeys) {
+          const text = asString(pathsRecord[key]);
+          if (text) {
+            paths[key] = text;
+          }
+        }
+      }
+      return {
+        fixtureId: asString(record.fixtureId) ?? missing(`fixtures[${index}].fixtureId`),
+        surfaceId: asString(record.surfaceId) ?? missing(`fixtures[${index}].surfaceId`),
+        brief: {
+          path: asString(brief.path) ?? missing(`fixtures[${index}].brief.path`),
+          sha256: asString(brief.sha256) ?? missing(`fixtures[${index}].brief.sha256`),
+        },
+        platformTarget: ensurePlatformTarget(record.platformTarget, `fixtures[${index}].platformTarget`),
+        consumerType: ensureConsumerType(record.consumerType, `fixtures[${index}].consumerType`),
+        capturePreset: asString(record.capturePreset) ?? "web-browser",
+        comparisonPairs: fixtureComparisonPairs,
+        ...(pathsRecord ? { paths } : {}),
+      };
+    }),
+  };
+}
+
+function loadGenerationBenchmarkRun(runPath: string): GenerationBenchmarkRun { // reads the run manifest JSON at the resolved `runPath`
+  return readJsonFile<JsonRecord>(path.resolve(runPath), "generation benchmark run") as unknown as GenerationBenchmarkRun; // NOTE(review): cast only — the manifest shape is not validated in this function
+}
+
+/** Tallies goal and guided-check counts over `entries`; `surfaceCount` is the number of distinct surface ids. */
+function buildBreakdownSummary(entries: Array<GenerationBenchmarkReport["comparisons"][number]>): GenerationBenchmarkBreakdownSummary {
+  const tally = (matches: (entry: (typeof entries)[number]) => unknown): number => entries.filter(matches).length;
+  return {
+    comparisonCount: entries.length,
+    surfaceCount: new Set(entries.map(({ surfaceId }) => surfaceId)).size,
+    surfacesMeetingGoal: tally(({ meetsGoal }) => meetsGoal),
+    guidedFewerFirstAttemptBlockingFindings: tally((row) => row.guidedFewerFirstAttemptBlockingFindings),
+    guidedReachedAcceptableNoLater: tally((row) => row.guidedReachedAcceptableNoLater),
+  };
+}
+
+/**
+ * Freezes a benchmark spec into a new run manifest: copies the spec to <out-dir>/spec.json,
+ * writes <out-dir>/run.json with empty sessions/comparisons per fixture, and prints
+ * { ok, run, paths } as JSON on stdout.
+ *
+ * @returns 0 on success, 10 for SessionInputError/AdapterInputError, 1 for any other failure.
+ */
+export async function runReplayGenerationBenchmarkCommand(
+  options: ReplayGenerationBenchmarkCommandOptions,
+): Promise<number> {
+  // Optional CLI strings are trimmed; blank or absent values become null in the manifest.
+  const trimmedOrNull = (text: string | undefined): string | null => text?.trim() || null;
+  try {
+    const { specPath: requestedSpecPath, outDir: requestedOutDir } = options;
+    if (!requestedSpecPath) {
+      throw new SessionInputError("--spec is required.");
+    }
+    if (!requestedOutDir) {
+      throw new SessionInputError("--out-dir is required.");
+    }
+    const tool = ensureSessionTool(options.tool);
+    const specPath = path.resolve(requestedSpecPath);
+    const spec = loadGenerationBenchmarkSpec(specPath);
+    const benchmarkDir = path.resolve(requestedOutDir);
+    const cohortId = options.cohortId?.trim() || buildDefaultBenchmarkCohortId();
+    const runPath = path.join(benchmarkDir, "run.json");
+    const copiedSpecPath = path.join(benchmarkDir, "spec.json");
+    const sourceRunPath = options.sourceRunPath ? path.resolve(options.sourceRunPath) : null;
+    const { suiteId, suiteName } = spec;
+
+    fs.mkdirSync(benchmarkDir, { recursive: true });
+    // Skip the copy when the spec already sits at the destination path.
+    const specAlreadyInPlace = path.resolve(specPath) === path.resolve(copiedSpecPath);
+    if (!specAlreadyInPlace) {
+      fs.copyFileSync(specPath, copiedSpecPath);
+    }
+
+    const run: GenerationBenchmarkRun = {
+      schemaVersion: 1,
+      cohortId,
+      generatedAt: new Date().toISOString(),
+      evaluationMode: spec.evaluationMode,
+      tool,
+      sourceSpecPath: specPath,
+      sourceRunPath,
+      attemptBudget: spec.attemptBudget,
+      guidanceStrategies: [...spec.guidanceStrategies],
+      comparisonPairs: spec.comparisonPairs.map((pair) => ({ ...pair })),
+      model: {
+        requestedModelLabel: trimmedOrNull(options.requestedModelLabel),
+        resolvedModelId: trimmedOrNull(options.resolvedModelId),
+        baseUrl: trimmedOrNull(options.baseUrl),
+        fingerprint: trimmedOrNull(options.fingerprint),
+      },
+      ...(suiteId ? { suiteId } : {}),
+      ...(suiteName ? { suiteName } : {}),
+      paths: {
+        benchmarkDir,
+        specPath: copiedSpecPath,
+        runPath,
+        reportJsonPath: null,
+        reportMarkdownPath: null,
+      },
+      fixtures: spec.fixtures.map((frozenFixture) => ({
+        ...frozenFixture,
+        sessions: [],
+        comparisons: [],
+      })),
+    };
+
+    writeDeterministicJsonSync(runPath, run);
+    const stdoutPayload = { ok: true, run, paths: { specPath: copiedSpecPath, runPath, benchmarkDir } };
+    process.stdout.write(`${JSON.stringify(stdoutPayload, null, 2)}\n`);
+    return 0;
+  } catch (error) {
+    if (!(error instanceof SessionInputError || error instanceof AdapterInputError)) {
+      writeError(error instanceof Error ? error : new Error(String(error)), "generation-session.internal");
+      return 1;
+    }
+    writeError(error, error.code);
+    return 10;
+  }
+}
+
 export async function runInitGenerationSessionCommand(
   options: InitGenerationSessionCommandOptions,
 ): Promise<number> {
@@ -2793,8 +3366,14 @@ export async function runSummarizeGenerationBenchmarkCommand(
   options: SummarizeGenerationBenchmarkCommandOptions,
 ): Promise<number> {
   try {
+    const run = options.runPath ? loadGenerationBenchmarkRun(options.runPath) : null;
     const comparisonPaths = parseCsvPaths(options.comparisonPaths);
-    if (comparisonPaths.length === 0) {
+    if (comparisonPaths.length === 0 && run) {
+      comparisonPaths.push(
+        ...run.fixtures.flatMap((fixture) => fixture.comparisons.map((comparison) => path.resolve(comparison.comparisonPath))),
+      );
+    }
+    if (comparisonPaths.length === 0 && !run) {
       throw new SessionInputError("--comparisons must include at least one comparison artifact path.");
     }
     const suggestionPaths = parseCsvPaths(options.suggestionPaths);
@@ -2806,22 +3385,61 @@ export async function runSummarizeGenerationBenchmarkCommand(
       path: suggestionPath,
       value: readJsonFile<JsonRecord>(suggestionPath, "contract delta suggestions artifact") as unknown as ContractDeltaSuggestionsArtifact,
     }));
+    const fixtureMetadataByComparisonPath = new Map<string, {
+      platformTarget: PlatformTarget;
+      consumerType: ConsumerType;
+    }>();
+    if (run) {
+      for (const fixture of run.fixtures) {
+        for (const comparison of fixture.comparisons) {
+          fixtureMetadataByComparisonPath.set(path.resolve(comparison.comparisonPath), {
+            platformTarget: fixture.platformTarget,
+            consumerType: fixture.consumerType,
+          });
+        }
+      }
+    }
 
     const report: GenerationBenchmarkReport = {
-      schemaVersion: 2,
+      schemaVersion: 3,
       generatedAt: new Date().toISOString(),
-      comparisons: comparisons.map(({ path: comparisonPath, value }) => ({
-        surfaceId: value.surfaceId,
-        tool: value.tool,
-        comparisonPath,
-        meetsGoal: value.checks.meetsGoal,
-        baselineGuidanceStrategy: value.baseline.guidanceStrategy,
-        guidedGuidanceStrategy: value.guided.guidanceStrategy,
-        guidedFewerFirstAttemptBlockingFindings: value.checks.guidedFewerFirstAttemptBlockingFindings,
-        guidedReachedAcceptableNoLater: value.checks.guidedReachedAcceptableNoLater,
-        guidedRubricBetterDimensions: value.checks.guidedRubricBetterDimensions,
-        heuristics: value.heuristics.delta,
-      })),
+      ...(run
+        ? {
+            run: {
+              cohortId: run.cohortId,
+              evaluationMode: run.evaluationMode,
+              tool: run.tool,
+              sourceSpecPath: run.sourceSpecPath,
+              sourceRunPath: run.sourceRunPath,
+              guidanceStrategies: [...run.guidanceStrategies],
+              attemptBudget: run.attemptBudget,
+              model: {
+                requestedModelLabel: run.model.requestedModelLabel,
+                resolvedModelId: run.model.resolvedModelId,
+                baseUrl: run.model.baseUrl,
+                fingerprint: run.model.fingerprint,
+              },
+            },
+          }
+        : {}),
+      comparisons: comparisons.map(({ path: comparisonPath, value }) => {
+        const comparisonMetadata = fixtureMetadataByComparisonPath.get(path.resolve(comparisonPath));
+        return {
+          surfaceId: value.surfaceId,
+          tool: value.tool,
+          comparisonPath,
+          meetsGoal: value.checks.meetsGoal,
+          baselineGuidanceStrategy: value.baseline.guidanceStrategy,
+          guidedGuidanceStrategy: value.guided.guidanceStrategy,
+          ...(comparisonMetadata ? { platformTarget: comparisonMetadata.platformTarget } : {}),
+          ...(comparisonMetadata ? { consumerType: comparisonMetadata.consumerType } : {}),
+          ...(run ? { modelLabel: run.model.requestedModelLabel ?? run.model.resolvedModelId ?? "unknown" } : {}),
+          guidedFewerFirstAttemptBlockingFindings: value.checks.guidedFewerFirstAttemptBlockingFindings,
+          guidedReachedAcceptableNoLater: value.checks.guidedReachedAcceptableNoLater,
+          guidedRubricBetterDimensions: value.checks.guidedRubricBetterDimensions,
+          heuristics: value.heuristics.delta,
+        };
+      }),
       suggestions: suggestions.map(({ path: suggestionsPath, value }) => ({
         surfaceId: value.surfaceId,
         sessionId: value.sessionId,
@@ -2831,7 +3449,7 @@ export async function runSummarizeGenerationBenchmarkCommand(
         rejectedCount: value.suggestions.filter((entry) => entry.status === "rejected").length,
       })),
       overall: {
-        surfaceCount: comparisons.length,
+        surfaceCount: comparisons.length > 0 ? comparisons.length : (run?.fixtures.length ?? 0),
         surfacesMeetingGoal: comparisons.filter(({ value }) => value.checks.meetsGoal).length,
         guidedFewerFirstAttemptBlockingFindings: comparisons.filter(
           ({ value }) => value.checks.guidedFewerFirstAttemptBlockingFindings,
@@ -2892,6 +3510,86 @@ export async function runSummarizeGenerationBenchmarkCommand(
           },
         },
       },
+      ...(run
+        ? {
+            breakdowns: {
+              byPlatformTarget: Object.fromEntries(
+                [...new Set(run.fixtures.map((fixture) => fixture.platformTarget))]
+                  .sort((left, right) => left.localeCompare(right))
+                  .map((platformTarget) => [
+                    platformTarget,
+                    buildBreakdownSummary(
+                      comparisons
+                        .map(({ path: comparisonPath, value }) => ({
+                          ...value,
+                          __comparisonPath: comparisonPath,
+                        }))
+                        .filter((entry) =>
+                          fixtureMetadataByComparisonPath.get(path.resolve(entry.__comparisonPath))?.platformTarget === platformTarget
+                        )
+                        .map((entry) => ({
+                          surfaceId: entry.surfaceId,
+                          tool: entry.tool,
+                          comparisonPath: entry.__comparisonPath,
+                          meetsGoal: entry.checks.meetsGoal,
+                          baselineGuidanceStrategy: entry.baseline.guidanceStrategy,
+                          guidedGuidanceStrategy: entry.guided.guidanceStrategy,
+                          guidedFewerFirstAttemptBlockingFindings: entry.checks.guidedFewerFirstAttemptBlockingFindings,
+                          guidedReachedAcceptableNoLater: entry.checks.guidedReachedAcceptableNoLater,
+                          guidedRubricBetterDimensions: entry.checks.guidedRubricBetterDimensions,
+                          heuristics: entry.heuristics.delta,
+                        })),
+                    ),
+                  ]),
+              ),
+              byConsumerType: Object.fromEntries(
+                [...new Set(run.fixtures.map((fixture) => fixture.consumerType))]
+                  .sort((left, right) => left.localeCompare(right))
+                  .map((consumerType) => [
+                    consumerType,
+                    buildBreakdownSummary(
+                      comparisons
+                        .map(({ path: comparisonPath, value }) => ({
+                          ...value,
+                          __comparisonPath: comparisonPath,
+                        }))
+                        .filter((entry) =>
+                          fixtureMetadataByComparisonPath.get(path.resolve(entry.__comparisonPath))?.consumerType === consumerType
+                        )
+                        .map((entry) => ({
+                          surfaceId: entry.surfaceId,
+                          tool: entry.tool,
+                          comparisonPath: entry.__comparisonPath,
+                          meetsGoal: entry.checks.meetsGoal,
+                          baselineGuidanceStrategy: entry.baseline.guidanceStrategy,
+                          guidedGuidanceStrategy: entry.guided.guidanceStrategy,
+                          guidedFewerFirstAttemptBlockingFindings: entry.checks.guidedFewerFirstAttemptBlockingFindings,
+                          guidedReachedAcceptableNoLater: entry.checks.guidedReachedAcceptableNoLater,
+                          guidedRubricBetterDimensions: entry.checks.guidedRubricBetterDimensions,
+                          heuristics: entry.heuristics.delta,
+                        })),
+                    ),
+                  ]),
+              ),
+              byModelLabel: {
+                [run.model.requestedModelLabel ?? run.model.resolvedModelId ?? "unknown"]: buildBreakdownSummary(
+                  comparisons.map(({ path: comparisonPath, value }) => ({
+                    surfaceId: value.surfaceId,
+                    tool: value.tool,
+                    comparisonPath,
+                    meetsGoal: value.checks.meetsGoal,
+                    baselineGuidanceStrategy: value.baseline.guidanceStrategy,
+                    guidedGuidanceStrategy: value.guided.guidanceStrategy,
+                    guidedFewerFirstAttemptBlockingFindings: value.checks.guidedFewerFirstAttemptBlockingFindings,
+                    guidedReachedAcceptableNoLater: value.checks.guidedReachedAcceptableNoLater,
+                    guidedRubricBetterDimensions: value.checks.guidedRubricBetterDimensions,
+                    heuristics: value.heuristics.delta,
+                  })),
+                ),
+              },
+            },
+          }
+        : {}),
     };
 
     const outDir = options.outDir
@@ -2901,7 +3599,17 @@ export async function runSummarizeGenerationBenchmarkCommand(
     const markdownPath = path.join(outDir, "benchmark-report.md");
     writeDeterministicJsonSync(jsonPath, report);
     fs.mkdirSync(path.dirname(markdownPath), { recursive: true });
-    fs.writeFileSync(markdownPath, renderBenchmarkReportMarkdown(report), "utf8");
+    fs.writeFileSync(markdownPath, renderBenchmarkReportMarkdown(report, run), "utf8");
+    if (run && options.runPath) {
+      writeDeterministicJsonSync(path.resolve(options.runPath), {
+        ...run,
+        paths: {
+          ...run.paths,
+          reportJsonPath: jsonPath,
+          reportMarkdownPath: markdownPath,
+        },
+      });
+    }
 
     process.stdout.write(
       `${JSON.stringify(
diff --git a/packages/interfacectl-cli/src/index.ts b/packages/interfacectl-cli/src/index.ts
index 656a794..d0b551b 100644
--- a/packages/interfacectl-cli/src/index.ts
+++ b/packages/interfacectl-cli/src/index.ts
@@ -21,6 +21,7 @@ import {
   runCompareGenerationSessionsCommand,
   runInitGenerationSessionCommand,
   runPrepareGenerationHandoffCommand,
+  runReplayGenerationBenchmarkCommand,
   runRecordGenerationAttemptCommand,
   runReviewContractDeltaSuggestionsCommand,
   runReviewGenerationAttemptCommand,
@@ -368,7 +369,7 @@ program
   .requiredOption("--surface <id>", "Surface identifier")
   .requiredOption("--workspace-root <path>", "Workspace root for emitted run artifacts")
   .option("--tool <tool>", "Generation tool identifier (codex|cursor|local-llm)")
-  .option("--guidance-strategy <strategy>", "Session guidance strategy (prompt-summary|json-primary|unguided)")
+  .option("--guidance-strategy <strategy>", "Session guidance strategy (prompt-summary|baseline-primary|json-primary|unguided)")
   .option("--guidance-mode <mode>", "Legacy alias for --guidance-strategy (prepared|unguided)")
   .option("--brief-file <path>", "Optional implementation brief file to freeze into the session")
   .option("--session <id>", "Optional session identifier")
@@ -391,7 +392,7 @@ program
   .command("prepare-generation-handoff")
   .description("Build one canonical strategy-aware guidance handoff artifact for a tracked generation session")
   .requiredOption("--session-dir <path>", "Path to the generation session directory")
-  .option("--guidance-strategy <strategy>", "Optional guidance strategy override (prompt-summary|json-primary|unguided)")
+  .option("--guidance-strategy <strategy>", "Optional guidance strategy override (prompt-summary|baseline-primary|json-primary|unguided)")
   .option("--accepted-suggestions <path>", "Optional accepted suggestions JSON file")
   .option("--designer-notes <path>", "Optional designer notes JSON file")
   .option("--finding-codes <codes>", "Optional comma-separated finding codes to match against repair guidance")
@@ -504,17 +505,45 @@ program
 program
   .command("summarize-generation-benchmark")
   .description("Aggregate one or more comparison and suggestion artifacts into a benchmark report")
-  .requiredOption("--comparisons <paths>", "Comma-separated generation session comparison JSON paths")
+  .option("--comparisons <paths>", "Comma-separated generation session comparison JSON paths")
   .option("--suggestions <paths>", "Comma-separated contract delta suggestion JSON paths")
+  .option("--run-path <path>", "Optional benchmark run manifest to enrich the benchmark report")
   .option("--out-dir <path>", "Output directory for the benchmark report")
   .action(async (options) => {
     process.exitCode = await runSummarizeGenerationBenchmarkCommand({
       comparisonPaths: options.comparisons,
       suggestionPaths: options.suggestions,
+      runPath: options.runPath,
       outDir: options.outDir,
     });
   });
 
+program // Registers the `replay-generation-benchmark` subcommand; --spec, --tool and --out-dir are required.
+  .command("replay-generation-benchmark")
+  .description("Freeze a benchmark spec into a new replayable benchmark run manifest")
+  .requiredOption("--spec <path>", "Path to the benchmark spec JSON file")
+  .requiredOption("--tool <tool>", "Generation tool identifier (codex|cursor|local-llm)")
+  .requiredOption("--out-dir <path>", "Output directory for the replay run")
+  .option("--cohort-id <id>", "Optional cohort id override")
+  .option("--source-run <path>", "Optional source benchmark run manifest")
+  .option("--requested-model-label <label>", "Optional requested model label")
+  .option("--resolved-model-id <id>", "Optional resolved runtime model id")
+  .option("--base-url <url>", "Optional model base URL")
+  .option("--fingerprint <value>", "Optional model/runtime fingerprint")
+  .action(async (options) => { // maps the parsed CLI options onto the command's option field names
+    process.exitCode = await runReplayGenerationBenchmarkCommand({ // the returned status becomes the process exit code
+      specPath: options.spec,
+      tool: options.tool,
+      outDir: options.outDir,
+      cohortId: options.cohortId,
+      sourceRunPath: options.sourceRun,
+      requestedModelLabel: options.requestedModelLabel,
+      resolvedModelId: options.resolvedModelId,
+      baseUrl: options.baseUrl,
+      fingerprint: options.fingerprint,
+    });
+  });
+
 program
   .command("validate-generation")
   .description("Validate generated UI against a compiled generation bundle")
diff --git a/packages/interfacectl-cli/test/generation-benchmark.test.mjs b/packages/interfacectl-cli/test/generation-benchmark.test.mjs
index 238e3af..4bc66a4 100644
--- a/packages/interfacectl-cli/test/generation-benchmark.test.mjs
+++ b/packages/interfacectl-cli/test/generation-benchmark.test.mjs
@@ -12,6 +12,8 @@ import { validateDiffOutput } from "@surfaces/interfacectl-validator";
 import generationSessionComparisonSchema from "../schemas/generation-session-comparison.schema.json" with { type: "json" };
 import contractDeltaSuggestionsSchema from "../schemas/contract-delta-suggestions.schema.json" with { type: "json" };
 import generationBenchmarkReportSchema from "../schemas/generation-benchmark-report.schema.json" with { type: "json" };
+import generationBenchmarkSpecSchema from "../schemas/generation-benchmark-spec.schema.json" with { type: "json" };
+import generationBenchmarkRunSchema from "../schemas/generation-benchmark-run.schema.json" with { type: "json" };
 
 const __filename = fileURLToPath(import.meta.url);
 const __dirname = path.dirname(__filename);
@@ -149,6 +151,7 @@ function buildAssessment({
   boundary,
   visual,
   responsiveness,
+  platformFit,
   notes,
   heuristics,
 }) {
@@ -158,6 +161,7 @@ function buildAssessment({
     boundary,
     visual,
     responsiveness,
+    platformFit: platformFit ?? responsiveness,
     notes,
     ...(heuristics ? { heuristics } : {}),
   };
@@ -596,3 +600,240 @@ test("strategy-aware benchmark artifacts compare sessions, emit deterministic su
     await fsp.rm(tempRoot, { recursive: true, force: true });
   }
 });
+
+test("replay-generation-benchmark freezes a copied spec and model attribution into a new run manifest", async () => {
+  const tempRoot = await fsp.mkdtemp(path.join(os.tmpdir(), "interfacectl-generation-benchmark-replay-"));
+  const specPath = path.join(tempRoot, "spec.json");
+  const outDir = path.join(tempRoot, "replay-run");
+  // Arrange: a spec with three guidance strategies, two comparison pairs and a single fixture.
+  try {
+    const spec = {
+      schemaVersion: 1,
+      specId: "demo-suite/spec",
+      generatedAt: "2026-04-02T00:00:00.000Z",
+      evaluationMode: "zero-shot",
+      attemptBudget: 1,
+      guidanceStrategies: ["unguided", "baseline-primary", "json-primary"],
+      comparisonPairs: [
+        {
+          baselineGuidanceStrategy: "unguided",
+          guidedGuidanceStrategy: "baseline-primary",
+        },
+        {
+          baselineGuidanceStrategy: "baseline-primary",
+          guidedGuidanceStrategy: "json-primary",
+        },
+      ],
+      suiteId: "demo-suite/default",
+      suiteName: "Demo Suite",
+      fixtures: [
+        {
+          fixtureId: "demo-surface",
+          surfaceId: "demo-surface",
+          brief: {
+            path: "/tmp/demo-brief.md",
+            sha256: "brief-hash",
+          },
+          platformTarget: "web",
+          consumerType: "desktop-shell",
+          capturePreset: "desktop-shell",
+          comparisonPairs: [
+            {
+              baselineGuidanceStrategy: "unguided",
+              guidedGuidanceStrategy: "baseline-primary",
+            },
+            {
+              baselineGuidanceStrategy: "baseline-primary",
+              guidedGuidanceStrategy: "json-primary",
+            },
+          ],
+        },
+      ],
+    };
+    await writeJson(specPath, spec);
+    validateWithSchema(spec, generationBenchmarkSpecSchema, "generation benchmark spec");
+    // Act: run the CLI with an explicit cohort id and full model attribution.
+    const replayResult = await runCli(
+      [
+        "replay-generation-benchmark",
+        "--spec",
+        specPath,
+        "--tool",
+        "local-llm",
+        "--out-dir",
+        outDir,
+        "--cohort-id",
+        "20260402000000",
+        "--requested-model-label",
+        "gpt-oss-20b",
+        "--resolved-model-id",
+        "openai/gpt-oss-20b",
+        "--base-url",
+        "http://127.0.0.1:1234/v1",
+        "--fingerprint",
+        "gpt-oss-20b-fingerprint",
+      ],
+      tempRoot,
+    );
+    assert.equal(replayResult.exitCode, 0, replayResult.stderr);
+    // Assert: the manifest at the reported runPath validates against the run schema and echoes the inputs.
+    const replayOutput = JSON.parse(replayResult.stdout);
+    const replayRun = JSON.parse(await fsp.readFile(replayOutput.paths.runPath, "utf8"));
+    validateWithSchema(replayRun, generationBenchmarkRunSchema, "generation benchmark run");
+    assert.equal(replayRun.sourceSpecPath, specPath);
+    assert.equal(replayRun.paths.specPath, path.join(outDir, "spec.json"));
+    assert.equal(replayRun.model.requestedModelLabel, "gpt-oss-20b");
+    assert.equal(replayRun.model.resolvedModelId, "openai/gpt-oss-20b");
+    assert.equal(replayRun.fixtures[0].consumerType, "desktop-shell");
+    assert.deepEqual(replayRun.fixtures[0].comparisons, []);
+  } finally {
+    await fsp.rm(tempRoot, { recursive: true, force: true });
+  }
+});
+
+test("summarize-generation-benchmark emits a report from run evidence even when no comparisons completed", async () => {
+  const tempRoot = await fsp.mkdtemp(path.join(os.tmpdir(), "interfacectl-generation-benchmark-evidence-only-"));
+  const specPath = path.join(tempRoot, "spec.json");
+  const outDir = path.join(tempRoot, "replay-run");
+  const reportDir = path.join(tempRoot, "benchmark-report");
+  // Arrange: a minimal two-strategy spec with one web-browser fixture.
+  try {
+    const spec = {
+      schemaVersion: 1,
+      specId: "demo-suite/spec",
+      generatedAt: "2026-04-02T00:00:00.000Z",
+      evaluationMode: "zero-shot",
+      attemptBudget: 1,
+      guidanceStrategies: ["unguided", "baseline-primary"],
+      comparisonPairs: [
+        {
+          baselineGuidanceStrategy: "unguided",
+          guidedGuidanceStrategy: "baseline-primary",
+        },
+      ],
+      suiteId: "demo-suite/default",
+      suiteName: "Demo Suite",
+      fixtures: [
+        {
+          fixtureId: "demo-surface",
+          surfaceId: "demo-surface",
+          brief: {
+            path: "/tmp/demo-brief.md",
+            sha256: "brief-hash",
+          },
+          platformTarget: "web",
+          consumerType: "web-browser",
+          capturePreset: "web-browser",
+          comparisonPairs: [
+            {
+              baselineGuidanceStrategy: "unguided",
+              guidedGuidanceStrategy: "baseline-primary",
+            },
+          ],
+        },
+      ],
+    };
+    await writeJson(specPath, spec);
+    // Create the run manifest through the CLI so the fixture list comes from the real command.
+    const replayResult = await runCli(
+      [
+        "replay-generation-benchmark",
+        "--spec",
+        specPath,
+        "--tool",
+        "local-llm",
+        "--out-dir",
+        outDir,
+        "--cohort-id",
+        "20260402000001",
+        "--requested-model-label",
+        "gpt-oss-20b",
+        "--resolved-model-id",
+        "openai/gpt-oss-20b",
+        "--base-url",
+        "http://127.0.0.1:1234/v1",
+        "--fingerprint",
+        "gpt-oss-20b-fingerprint",
+      ],
+      tempRoot,
+    );
+    assert.equal(replayResult.exitCode, 0, replayResult.stderr);
+    // Derive a manifest variant that lists two sessions per fixture but still has no comparisons.
+    const replayOutput = JSON.parse(replayResult.stdout);
+    const replayRun = JSON.parse(await fsp.readFile(replayOutput.paths.runPath, "utf8"));
+    const sessionRoot = path.join(tempRoot, "sessions");
+    const runWithSessionsPath = path.join(outDir, "run-with-sessions.json");
+    const runWithSessions = {
+      ...replayRun,
+      fixtures: replayRun.fixtures.map((fixture) => ({
+        ...fixture,
+        sessions: [
+          {
+            guidanceStrategy: "unguided",
+            sessionId: `${fixture.surfaceId}/unguided`,
+            sessionDir: path.join(sessionRoot, fixture.surfaceId, "unguided"),
+            summaryPath: path.join(sessionRoot, fixture.surfaceId, "unguided", "summary.json"),
+            guidanceHandoffPath: path.join(sessionRoot, fixture.surfaceId, "unguided", "guidance-handoff.txt"),
+            agentInputPath: path.join(sessionRoot, fixture.surfaceId, "unguided", "agent-input.txt"),
+            previewPath: null,
+          },
+          {
+            guidanceStrategy: "baseline-primary",
+            sessionId: `${fixture.surfaceId}/baseline-primary`,
+            sessionDir: path.join(sessionRoot, fixture.surfaceId, "baseline-primary"),
+            summaryPath: path.join(sessionRoot, fixture.surfaceId, "baseline-primary", "summary.json"),
+            guidanceHandoffPath: path.join(sessionRoot, fixture.surfaceId, "baseline-primary", "guidance-handoff.txt"),
+            agentInputPath: path.join(sessionRoot, fixture.surfaceId, "baseline-primary", "agent-input.txt"),
+            previewPath: null,
+          },
+        ],
+      })),
+    };
+    await writeJson(runWithSessionsPath, runWithSessions);
+    const [unguidedSession, baselineSession] = runWithSessions.fixtures[0].sessions;
+    // Write summary files at the paths the manifest references; the baseline-primary one records an error.
+    await writeJson(unguidedSession.summaryPath, {
+      schemaVersion: 1,
+      sessionId: unguidedSession.sessionId,
+      surfaceId: runWithSessions.fixtures[0].surfaceId,
+      guidanceStrategy: "unguided",
+      latestStatus: "warn",
+      latestOutcome: "warn",
+      attempts: [],
+    });
+    await writeJson(baselineSession.summaryPath, {
+      schemaVersion: 1,
+      sessionId: baselineSession.sessionId,
+      surfaceId: runWithSessions.fixtures[0].surfaceId,
+      guidanceStrategy: "baseline-primary",
+      latestStatus: "block",
+      latestOutcome: "error",
+      errorMessage: "Model crashed during compile.",
+      attempts: [],
+    });
+    // Act: summarize with only --run-path (no --comparisons).
+    const benchmarkResult = await runCli(
+      [
+        "summarize-generation-benchmark",
+        "--run-path",
+        runWithSessionsPath,
+        "--out-dir",
+        reportDir,
+      ],
+      tempRoot,
+    );
+    assert.equal(benchmarkResult.exitCode, 0, benchmarkResult.stderr);
+    // Assert: the report validates, counts the fixture as one surface, and lists no comparisons.
+    const benchmarkOutput = JSON.parse(benchmarkResult.stdout);
+    const benchmarkReport = JSON.parse(await fsp.readFile(benchmarkOutput.paths.jsonPath, "utf8"));
+    validateWithSchema(benchmarkReport, generationBenchmarkReportSchema, "generation benchmark report");
+    assert.equal(benchmarkReport.overall.surfaceCount, 1);
+    assert.deepEqual(benchmarkReport.comparisons, []);
+    // The markdown is expected to show an empty comparisons section and the recorded session error.
+    const markdown = await fsp.readFile(benchmarkOutput.paths.markdownPath, "utf8");
+    assert.match(markdown, /## Comparisons\n- none/);
+    assert.match(markdown, /- error: Model crashed during compile\./);
+  } finally {
+    await fsp.rm(tempRoot, { recursive: true, force: true });
+  }
+});
diff --git a/packages/interfacectl-cli/test/generation-session.test.mjs b/packages/interfacectl-cli/test/generation-session.test.mjs
index f6ac884..b444c9f 100644
--- a/packages/interfacectl-cli/test/generation-session.test.mjs
+++ b/packages/interfacectl-cli/test/generation-session.test.mjs
@@ -154,6 +154,7 @@ function buildAssessment({
   boundary,
   visual,
   responsiveness,
+  platformFit,
   notes,
   touchedFiles,
   heuristics,
@@ -164,6 +165,7 @@ function buildAssessment({
     boundary,
     visual,
     responsiveness,
+    platformFit: platformFit ?? responsiveness,
     notes,
     ...(touchedFiles ? { touchedFiles } : {}),
     ...(heuristics ? { heuristics } : {}),
@@ -820,6 +822,7 @@ test("generation session commands reject invalid bundle roots, duplicate session
       boundary: "weak",
       visual: "partial",
       responsiveness: "weak",
+      platformFit: "weak",
       notes: "Invalid assessment payload.",
     });