diff --git a/.forge/ralph/apply-worker-cli-v5/prd.json b/.forge/ralph/apply-worker-cli-v5/prd.json
deleted file mode 100644
index 4437cd4..0000000
--- a/.forge/ralph/apply-worker-cli-v5/prd.json
+++ /dev/null
@@ -1,58 +0,0 @@
-{
-  "project": "Webster",
-  "branchName": "ralph/apply-worker-cli-v5",
-  "prdFile": "prd.md",
-  "description": "Expose the existing apply-worker core as a weekly CLI and prove mutation, commit trailers, and validation blocking with integration tests.",
-  "userStories": [
-    {
-      "id": "US-001",
-      "title": "Add apply-worker CLI wrapper",
-      "description": "As a Webster operator, I want a Bun CLI that runs the existing apply-worker core against a weekly history directory so that selected proposal issues become validated experiment commits without manual orchestration.",
-      "acceptanceCriteria": [
-        "Add a script entrypoint following repo conventions, likely scripts/apply-worker/cli.ts, with a #!/usr/bin/env bun shebang and import.meta.main guard.",
-        "The CLI accepts a week directory argument and reads proposal.md plus decision.json from that directory.",
-        "The CLI uses existing exports from scripts/apply-worker.ts for parseDecision, parseProposal, applyMutation, runValidation, buildCommitMessage, commitExperiment, emitSkip, and writeApplyLog instead of duplicating US-001 through US-004 core logic.",
-        "For each selected issue, the CLI applies mutations, runs lint, type-check, and format-check before committing, and creates one Git commit only when all three validation checks pass.",
-        "Every successful experiment commit message includes the existing trailer format Experiment-Id: exp-NN-slug validated by buildCommitMessage.",
-        "String mismatches or validation failures are recorded as skipped experiments in apply-log.json and emit structured skip rows through emitSkip without creating a commit for that experiment.",
-        "Missing week directory, missing proposal.md, or missing decision.json produces a clear non-zero CLI error without mutating files.",
-        "Type-check passes",
-        "Lint passes with zero warnings",
-        "Format check passes",
-        "Tests pass"
-      ],
-      "technicalNotes": "Build on scripts/apply-worker.ts:287-317 for parseDecision/parseProposal, 319-357 for applyMutation, 359-369 for runValidation, 372-393 for buildCommitMessage, 395-429 for commitExperiment, and 442-457 for emitSkip/writeApplyLog. Mirror CLI entrypoint/error shape from scripts/critic-genealogy.ts:676-694 and package script style from package.json scripts. Fixture artifact shapes are visible in history/2026-04-23/decision.json and history/2026-04-23/proposal.md.",
-      "dependsOn": [],
-      "priority": 1,
-      "passes": true,
-      "notes": "Implemented in iteration 1. Files: scripts/apply-worker-cli.ts, scripts/apply-worker.ts, package.json, .forge/ralph/apply-worker-cli-v5/prd.md."
-    },
-    {
-      "id": "US-002",
-      "title": "Add apply-worker integration tests",
-      "description": "As a Webster maintainer, I want integration tests around the apply-worker CLI so that successful proposals mutate and commit correctly while broken proposals are blocked before commit.",
-      "acceptanceCriteria": [
-        "Add Bun tests under scripts/__tests__/ using the existing bun:test style from scripts/__tests__/memory.test.ts.",
-        "Create fixture proposal.md and decision.json inputs that match the existing weekly schema and proposal format shown in history/2026-04-23 artifacts.",
-        "A successful fixture run verifies the target file content changed from the Before block to the After block.",
-        "A successful fixture run verifies git history contains a commit message trailer exactly matching Experiment-Id: exp-01-<slug> for the applied issue.",
-        "A successful fixture run verifies apply-log.json records the applied experiment with status applied and a commit_sha.",
-        "A deliberately broken proposal or validation-breaking mutation does not create a Git commit for that experiment.",
-        "The blocked fixture verifies apply-log.json and/or skips.jsonl records the terminal skip reason, including validation failure when the output fails the lint/type/format floor.",
-        "Tests isolate Git state and filesystem mutations in temporary directories or fixture repositories and do not mutate Webster's real history or site files.",
-        "bun run validate passes before committing the story.",
-        "Type-check passes",
-        "Lint passes with zero warnings",
-        "Format check passes",
-        "Tests pass"
-      ],
-      "technicalNotes": "Use scripts/__tests__/memory.test.ts:1-18 as the temp-path and cleanup pattern. Exercise the CLI from US-001 rather than only unit-testing helper functions. Keep fixtures minimal but schema-faithful to history/2026-04-23/decision.json:1-25 and proposal markdown sections from history/2026-04-23/proposal.md:1-28. Inspect commit messages with git log in the isolated fixture repo. The broken-output case should prove runValidation from scripts/apply-worker.ts:359-369 prevents commitExperiment from scripts/apply-worker.ts:395-429.",
-      "dependsOn": [
-        "US-001"
-      ],
-      "priority": 2,
-      "passes": true,
-      "notes": "Implemented in iteration 2. Files: scripts/__tests__/apply-worker-cli.test.ts."
-    }
-  ]
-}
diff --git a/.forge/ralph/apply-worker-cli-v5/prd.md b/.forge/ralph/apply-worker-cli-v5/prd.md
deleted file mode 100644
index 75910b0..0000000
--- a/.forge/ralph/apply-worker-cli-v5/prd.md
+++ /dev/null
@@ -1,180 +0,0 @@
-# Apply Worker CLI v5 — Product Requirements
-
-## Overview
-
-**Problem**: Webster has the apply-worker core for parsing `proposal.md`, applying text mutations, running validation, emitting skip rows, writing `apply-log.json`, and building experiment commit messages, but the weekly operator still lacks a single CLI entrypoint and integration-level proof that the full proposal-to-commit path is safe.
-**Solution**: Add a thin CLI wrapper around the existing apply-worker core and integration tests that exercise successful mutation commits, correct `Experiment-Id` trailers, and validation-blocked broken proposals.
-**Branch**: `ralph/apply-worker-cli-v5`
-
----
-
-## Goals & Success
-
-### Primary Goal
-
-Expose the merged apply-worker core as a production CLI that can be run against a weekly history directory and can commit only validated experiment mutations.
-
-### Success Metrics
-
-| Metric | Target | How Measured |
-|--------|--------|--------------|
-| CLI entrypoint exists | `scripts/apply-worker/cli.ts` or repo-convention equivalent invokes the core from a weekly directory | Code review and `bun` execution in tests |
-| Valid experiment commits | Every applied experiment creates a Git commit with `Experiment-Id: exp-NN-slug` | Integration test inspects `git log --format=%B` |
-| Broken output is blocked | A deliberately broken proposal does not create a commit | Integration test compares commit count and apply log/skip output |
-| Quality floor | Type, lint, format, validators, markdownlint, and tests pass | `bun run validate` |
-
-### Non-Goals (Out of Scope)
-
-- Reimplementing US-001 through US-004 — the core parser, text mutation engine, validation gate, skip-row emission, and apply-log writer already exist in `scripts/apply-worker.ts`.
-- Multi-kind proposal routing — tracked separately in Layer 10 #47-#49.
-- Visual review or critic rerun gates — downstream of the apply step and not part of this remaining scope.
-- Changing proposal or decision schemas — this story consumes the existing `proposal.md` and `decision.json` shapes.
-
----
-
-## User & Context
-
-### Target User
-
-- **Who**: Webster implementation operator running the weekly landing-page improvement loop.
-- **Role**: Takes a redesigner proposal and operator decision from `history/<week>/`, applies selected edits, and promotes only safe experiments.
-- **Current Pain**: The core code exists but the operator cannot reliably run one command that reads weekly artifacts, applies each selected issue, validates, commits, and records blocked experiments.
-
-### User Journey
-
-1. **Trigger**: The weekly council produces `history/<week>/proposal.md` and `history/<week>/decision.json`.
-2. **Action**: The operator runs the apply-worker CLI against that week directory.
-3. **Outcome**: Each valid selected issue lands as its own commit with an experiment trailer; invalid or validation-breaking issues are skipped and recorded without a commit.
-
----
-
-## UX Requirements
-
-### Interaction Model
-
-Command-line only. The CLI should follow existing script conventions: executable Bun TypeScript files under `scripts/`, `#!/usr/bin/env bun`, `import.meta.main` guard, explicit usage/error output, and non-zero exits for bad invocation. Existing entrypoint patterns appear in `scripts/critic-genealogy.ts:676-694`, `scripts/validate-agents.ts:129`, and `scripts/validate-findings.ts:108`.
-
-Likely command shape:
-
-```bash
-bun scripts/apply-worker/cli.ts history/2026-04-23
-```
-
-The CLI reads:
-
-- `<weekDir>/proposal.md`
-- `<weekDir>/decision.json`
-
-The CLI writes:
-
-- `<weekDir>/apply-log.json`
-- `<weekDir>/skips.jsonl` when an experiment is skipped
-- `<weekDir>/memory.jsonl` skip rows via the existing helper
-- one Git commit per validated experiment
-
-### States to Handle
-
-| State | Description | Behavior |
-|-------|-------------|----------|
-| Empty | Week directory or required files are missing | Print usage/error and exit non-zero without mutating files |
-| Loading | CLI is applying one selected proposal issue | Log current experiment id/title and validation status to stdout/stderr |
-| Error | Proposal parse, string mismatch, validation failure, git add, or git commit fails | Record terminal skip when applicable; fail clearly for unrecoverable setup/git errors |
-| Success | All selected issues were either committed or explicitly skipped | Write `apply-log.json`; exit 0 if the run completed deterministically |
-
----
-
-## Technical Context
-
-### Patterns to Follow
-
-- **Apply-worker core**: `scripts/apply-worker.ts:287-317` — `parseDecision` and `parseProposal` already map weekly artifacts into selected proposal issues.
-- **Mutation engine**: `scripts/apply-worker.ts:319-357` — `applyMutation` performs exact string replacement and returns `string_mismatch` instead of silently proceeding.
-- **Validation floor**: `scripts/apply-worker.ts:359-369` — `runValidation` runs lint, type-check, and format-check; the CLI must treat any failure as a no-commit skip for that experiment.
-- **Commit trailer format**: `scripts/apply-worker.ts:372-393` — `buildCommitMessage` validates `exp-NN-slug` and emits `Experiment-Id: ${expId}`.
-- **Git commit helper**: `scripts/apply-worker.ts:395-429` — `commitExperiment` stages touched files and parses the commit SHA.
-- **Skip/apply-log writers**: `scripts/apply-worker.ts:442-457` — `emitSkip` and `writeApplyLog` already write terminal skip rows and `apply-log.json`.
-- **Fixture schemas**: `history/2026-04-23/decision.json:1-25` shows `week` plus `selected_issues`; `history/2026-04-23/proposal.md:1-28` shows issue headings, target files, and Before/After blocks.
-- **Test pattern**: `scripts/__tests__/memory.test.ts:1-18` uses `bun:test`, temp paths, and explicit cleanup; use the same style for integration fixtures.
-- **CLI error pattern**: `scripts/critic-genealogy.ts:676-694` guards `import.meta.main`, maps usage errors to exit 2, and unexpected failures to exit 1.
-
-### Types & Interfaces
-
-```typescript
-export interface DecisionJSON {
-  week: string;
-  selected_issues: DecisionIssue[];
-}
-
-export interface ProposalIssue {
-  index: number;
-  severity: Severity;
-  title: string;
-  files_touched: string[];
-  mutations: RawMutation[];
-}
-
-export interface ApplyExperiment {
-  exp_id: string;
-  severity: Severity;
-  title: string;
-  status: "applied" | "skipped";
-  mutations: MutationResult[];
-  commit_sha?: string;
-  skip_reason?: "string_mismatch" | "lint_failure" | "type_failure" | "format_failure";
-  skip_details?: Record<string, unknown>;
-}
-
-export interface ApplyLogJSON {
-  week: string;
-  run_timestamp: string;
-  experiments: ApplyExperiment[];
-  validation_summary: {
-    lint_passed: boolean;
-    type_check_passed: boolean;
-    format_check_passed: boolean;
-  };
-}
-```
-
-### Architecture Notes
-
-- Build strictly on top of `scripts/apply-worker.ts`; do not duplicate parser, mutation, validation, skip, log, or commit helpers.
-- If the current file must be split to support `scripts/apply-worker/cli.ts`, preserve public exports and avoid changing landed US-001-US-004 behavior except where CLI orchestration needs a missing exported helper.
-- Each selected issue should be treated as a separate experiment with deterministic id `exp-${NN}-${slug}` through the existing `buildCommitMessage` guard.
-- The hard floor is lint + type-check + format-check before commit. Full repository validation (`bun run validate`) remains the story completion gate.
-- Integration tests may need to run in a temporary Git repository or carefully isolated fixture repo so real Webster history is not mutated.
-
----
-
-## Implementation Summary
-
-### Story Overview
-
-| ID | Title | Priority | Dependencies |
-|----|-------|----------|--------------|
-| US-001 | Add apply-worker CLI wrapper | 1 | — |
-| US-002 | Add apply-worker integration tests | 2 | US-001 |
-
-### Dependency Graph
-
-```text
-US-001 (CLI wrapper around existing core)
-    ↓
-US-002 (integration tests for commits, mutation, and validation blocking)
-```
-
----
-
-## Validation Requirements
-
-Every story must pass:
-
-- [ ] Type-check: `bun run type-check`
-- [ ] Lint: `bun run lint --max-warnings 0`
-- [ ] Tests: `bun run test`
-- [ ] Format: `bun run format:check`
-- [ ] Full gate before final commit: `bun run validate`
-
----
-
-Generated: 2026-04-24T07:47:46Z
diff --git a/.forge/ralph/genealogy-gov-v1/prd.json b/.forge/ralph/genealogy-gov-v1/prd.json
deleted file mode 100644
index 705e9da..0000000
--- a/.forge/ralph/genealogy-gov-v1/prd.json
+++ /dev/null
@@ -1,75 +0,0 @@
-{
-  "project": "Webster",
-  "branchName": "ralph/genealogy-gov-v1",
-  "prdFile": "prd.md",
-  "description": "Implement Feature #55 genealogy governance layers 2-4: dedup, 13-week cap, and archive-on-idle.",
-  "userStories": [
-    {
-      "id": "US-001",
-      "title": "Layer 2 embedding dedup blocks overlapping critic specs",
-      "description": "As a Webster operator, I want new critic specs rejected when their scope substantially overlaps an existing critic so that genealogy does not create duplicate weekly agents.",
-      "acceptanceCriteria": [
-        "Add an orchestrator-side dedup helper in scripts/critic-genealogy.ts that compares a candidate NewCriticSpec against active CriticSummary entries using embedding cosine similarity over scope and description text.",
-        "Reject candidate specs with cosine similarity >= 0.60 to any active critic before registerAgent() performs POST /v1/agents.",
-        "Governance rejection prints the closest existing critic name, similarity score, and candidate scope without registering an agent or creating a session.",
-        "Dry-run mode still runs and reports the dedup decision before printing a would-register spec.",
-        "Unit tests cover below-threshold allow, exactly-0.60 reject, and above-threshold reject behavior without live Anthropic network calls.",
-        "Type-check passes",
-        "Tests pass",
-        "bun run validate passes"
-      ],
-      "technicalNotes": "Modify scripts/critic-genealogy.ts around NewCriticSpec/CriticSummary definitions (lines 31-60), active critic loading (lines 155-168), and the main flow before registerAgent() (lines 457+ and main registration section). Follow fail-fast error style from lines 339-356. Add tests in scripts/__tests__/critic-genealogy.test.ts mirroring direct helper tests at lines 93-120 and 160-203. Existing agents expose metadata.scope and description in agents/*-critic.json.",
-      "dependsOn": [],
-      "priority": 1,
-      "passes": true,
-      "notes": "Implemented in iteration 1. Files: scripts/critic-genealogy.ts, scripts/__tests__/critic-genealogy.test.ts, .forge/ralph/genealogy-gov-v1/prd.md."
-    },
-    {
-      "id": "US-002",
-      "title": "Layer 3 13-week cap with operator soft override",
-      "description": "As a Webster operator, I want a maximum of 3 new critics per 13 weeks with a deliberate override flag so that genealogy growth is bounded but not blocked in exceptional cases.",
-      "acceptanceCriteria": [
-        "Add a CLI soft-override flag, named --override-quarterly-cap or equivalent, to parseArgs() and CLIArgs in scripts/critic-genealogy.ts.",
-        "Count spawned critic specs from history/<YYYY-MM-DD>/genealogy/spec.json in the rolling 13-week window ending at args.weekDate.",
-        "Block registration when the count is already 3 or more and the override flag is false.",
-        "Allow registration when the count is 3 or more only if the override flag is true, and print an explicit operator override message.",
-        "Ignore malformed or missing non-genealogy history directories only when they are irrelevant; malformed in-window genealogy spec data fails loudly with an actionable error.",
-        "Unit tests cover count 0, count 2 allow, count 3 block, count 3 with override allow, and boundary dates at exactly 13 weeks.",
-        "Type-check passes",
-        "Tests pass",
-        "bun run validate passes"
-      ],
-      "technicalNotes": "Extend scripts/critic-genealogy.ts parseArgs() at lines 72-105 and printUsage() at lines 107-115. Use writeArtifacts() output convention at lines 570-585: each spawn writes history/<week>/genealogy/spec.json. Gate the main flow before registerAgent() and createSession(). Add parseArgs tests beside scripts/__tests__/critic-genealogy.test.ts lines 44-75 and helper tests with temporary history fixtures.",
-      "dependsOn": [
-        "US-001"
-      ],
-      "priority": 2,
-      "passes": true,
-      "notes": "Implemented in iteration 2. Files: scripts/critic-genealogy.ts, scripts/__tests__/critic-genealogy.test.ts."
-    },
-    {
-      "id": "US-003",
-      "title": "Layer 4 archive idle spawned critics",
-      "description": "As a Webster operator, I want spawned critics with no promoted findings in 8 weeks archived so that inactive council members stop consuming weekly attention and tokens.",
-      "acceptanceCriteria": [
-        "Add archive-on-idle logic in scripts/critic-genealogy.ts that evaluates spawned critics and moves idle specs from agents/<name>.json to agents/archive/<name>.json.",
-        "A spawned critic is archived only when it has 0 findings promoted across the last 8 weeks; critics with at least 1 promoted finding in that window remain active.",
-        "Original committed baseline critics are not archived by the idle rule unless history proves they were genealogy-spawned.",
-        "loadExistingCritics() continues to load only active agents/*-critic.json files and excludes agents/archive/*.json by path.",
-        "Archive actions create agents/archive/ if missing and preserve the JSON spec byte-for-byte except for formatting caused by existing JSON write conventions if needed.",
-        "Unit tests cover idle spawned critic archived, active spawned critic retained, original critic retained, and archived critic excluded from active critic summaries.",
-        "Type-check passes",
-        "Tests pass",
-        "bun run validate passes"
-      ],
-      "technicalNotes": "Implement in scripts/critic-genealogy.ts near loadExistingCritics() lines 155-168 and main startup before active critic summary logging. Use agents/*-critic.json naming shown by agents/brand-voice-critic.json and peers. Use genealogy provenance from history/<week>/genealogy/spec.json created by writeArtifacts() lines 570-585. Add tests in scripts/__tests__/critic-genealogy.test.ts next to loadExistingCritics tests at lines 78-90; use temporary fixture directories or exported pure helpers to avoid mutating real agents during tests.",
-      "dependsOn": [
-        "US-001",
-        "US-002"
-      ],
-      "priority": 3,
-      "passes": true,
-      "notes": "Implemented in iteration 3. Files: scripts/critic-genealogy.ts, scripts/__tests__/critic-genealogy.test.ts."
-    }
-  ]
-}
diff --git a/.forge/ralph/genealogy-gov-v1/prd.md b/.forge/ralph/genealogy-gov-v1/prd.md
deleted file mode 100644
index bf766f1..0000000
--- a/.forge/ralph/genealogy-gov-v1/prd.md
+++ /dev/null
@@ -1,172 +0,0 @@
-# Genealogy Governance Layers 2-4 — Product Requirements
-
-## Overview
-
-**Problem**: Webster can now spawn new critics at runtime, but without code-level governors the council can duplicate existing critic scopes, exceed a sensible growth rate, and keep idle critics in weekly runs indefinitely. That creates token-waste drift and weakens the demo claim that genealogy is controlled rather than chaotic.
-**Solution**: Implement Q5.1 governance layers 2-4 in the existing genealogy registration path: embedding-based deduplication before registration, a 13-week cap with operator soft override, and archive-on-idle pruning for critics with no promoted findings across 8 weeks.
-**Branch**: `ralph/genealogy-gov-v1`
-
----
-
-## Goals & Success
-
-### Primary Goal
-
-Bound runtime critic spawning while preserving legitimate, operator-overridable genealogy growth.
-
-### Success Metrics
-
-| Metric | Target | How Measured |
-|--------|--------|--------------|
-| Duplicate critic rejection | New critic specs with >=60% embedding cosine similarity to an existing critic are rejected before `POST /v1/agents` | Unit tests around `scripts/critic-genealogy.ts` registration path |
-| Quarterly spawn cap | More than 3 new critics in any rolling 13-week window is blocked unless an operator override flag is present | Unit tests using historical `history/*/genealogy/spec.json` fixtures |
-| Idle critic retirement | Spawned critics with 0 promoted findings over 8 weeks are moved to `agents/archive/` and excluded from active critic loading | Unit tests around archive-on-idle logic and `loadExistingCritics()` behavior |
-| Validation | `bun run validate` passes with zero lint warnings | Project validation command |
-
-### Non-Goals (Out of Scope)
-
-- Layer 1 prompt rubric edits in `prompts/second-wbs-session.md` — explicitly deferred until `feat/orch-memory-planner-v2` PR #6 merges because that branch is actively modifying the same file.
-- Redesigning planner or redesigner request schemas — Feature #55 scope is governance layers 2-4 only.
-- Deleting retired critics from Git history or the Managed Agents API — Layer 4 archives local specs recoverably rather than destructive deletion.
-- Building live embedding infrastructure beyond this path — the dedup check is local to `scripts/critic-genealogy.ts` new-critic registration.
-
----
-
-## User & Context
-
-### Target User
-
-- **Who**: Webster operator running weekly landing-page improvement sessions.
-- **Role**: Maintains a council of Claude Managed Agents and reviews automated changes before submission or deployment.
-- **Current Pain**: Runtime genealogy is powerful, but every extra critic is a recurring weekly cost. Duplicate or idle critics turn the council into an expensive echo chamber.
-
-### User Journey
-
-1. **Trigger**: Planner or genealogy detection identifies a possible unowned concern and `scripts/critic-genealogy.ts` prepares a new critic spec.
-2. **Action**: The orchestrator-side genealogy script evaluates overlap, recent spawn count, and idle critic state before registering or invoking agents.
-3. **Outcome**: Legitimate critics are registered and invoked; duplicate or over-cap critics are blocked with explicit evidence; idle spawned critics are archived before future council runs.
-
----
-
-## UX Requirements
-
-### Interaction Model
-
-This is backend/CLI orchestration. The primary interface remains:
-
-```bash
-bun scripts/critic-genealogy.ts --branch <council-branch> [--week YYYY-MM-DD] [--lp-target URL] [--dry-run]
-bun scripts/critic-genealogy.ts --fixtures <dir> [--week YYYY-MM-DD] [--lp-target URL] [--dry-run]
-```
-
-Layer 3 adds an operator soft-override flag, for example `--override-quarterly-cap`, that allows a human-approved spawn when the 13-week cap has already been reached. Layer 4 archive-on-idle should run from the same script before active critic loading/registration so archived critics are not considered active council members.
-
-### States to Handle
-
-| State | Description | Behavior |
-|-------|-------------|----------|
-| Empty | No spawned genealogy history or no archived critics yet | Dedup still compares against current `agents/*-critic.json`; cap count is 0; retire pass no-ops |
-| Loading | Embedding similarity or API-backed registration is in progress | Script prints explicit progress and continues existing fail-fast error behavior |
-| Error | Embedding request fails, malformed history exists, archive move fails, or cap blocks without override | Script exits non-zero for operational errors; governance blocks print actionable reason and skip registration |
-| Success | New spec is below 60% overlap, under cap or operator-overridden, and idle critics are archived | Script registers/invokes as today and writes artifacts; archive pass moves idle specs to `agents/archive/` |
-
----
-
-## Technical Context
-
-### Patterns to Follow
-
-- **Similar implementation**: `scripts/critic-genealogy.ts:155-168` — active critics are discovered from `agents/*-critic.json`; Layer 4 should exclude `agents/archive/` by keeping archived files outside this glob.
-- **Similar implementation**: `scripts/critic-genealogy.ts:457-477` — `registerAgent()` is the correct choke point before `POST /v1/agents`; Layer 2 and Layer 3 checks should run before this call.
-- **Similar implementation**: `scripts/critic-genealogy.ts:570-585` — `writeArtifacts()` records genealogy specs under `history/<week>/genealogy/`; Layer 3 can count recent spawns from these artifacts.
-- **Component pattern**: `scripts/critic-genealogy.ts:72-105` — CLI flags are parsed with explicit mutually-exclusive validation and `CLIError`; add the soft-override flag here.
-- **Error handling pattern**: `scripts/critic-genealogy.ts:141-152` and `scripts/critic-genealogy.ts:339-356` — invalid state fails loudly with clear error messages, no silent fallback.
-- **Test pattern**: `scripts/__tests__/critic-genealogy.test.ts:44-75` — CLI parsing tests assert accepted and rejected flags.
-- **Test pattern**: `scripts/__tests__/critic-genealogy.test.ts:78-90` — active critic loading behavior is unit-tested directly.
-- **Test pattern**: `scripts/__tests__/critic-genealogy.test.ts:160-203` — generated agent JSON behavior is tested with direct helpers and schema validation.
-
-### Types & Interfaces
-
-```typescript
-interface NewCriticSpec {
-  name: string;
-  scope: string;
-  description: string;
-  rationale: string;
-  focus_owned: string[];
-  focus_not_owned: string[];
-  severity_rubric: string;
-}
-
-interface AgentJSON {
-  name: string;
-  description: string;
-  model: string;
-  system: string;
-  tools: unknown[];
-  mcp_servers?: unknown[];
-  metadata?: Record<string, string>;
-}
-
-interface CriticSummary {
-  name: string;
-  scope: string;
-  description: string;
-}
-
-interface CLIArgs {
-  branch: string | null;
-  fixtures: string | null;
-  weekDate: string;
-  lpTarget: string;
-  dryRun: boolean;
-  // add: overrideQuarterlyCap: boolean;
-}
-```
-
-### Architecture Notes
-
-- Feature #55 is governed by `context/FEATURES.md:170` and Q5.1 in `context/DOMAIN-MODEL.md:303-333`; use the user's updated thresholds for this PRD: 60% cosine overlap, max 3 critics per 13 weeks, and 0 promoted findings in 8 weeks.
-- Existing critic specs live in `agents/*-critic.json`; active critics include the five original critics plus `visual-design-critic.json` if present.
-- Spawn artifacts live under `history/<week>/genealogy/spec.json`, created by `writeArtifacts()`.
-- Registration currently happens through `registerAgent()` after `spliceNewSpec()` creates an `AgentJSON`; governance should block before remote agent creation and before session creation.
-- Promoted findings evidence should come from existing history artifacts where available. If implementation needs a source of truth, prefer explicit history rows over inferring from current findings text.
-- Validation follows `CLAUDE.md`: zero lint warnings, full type check, format check, tests, and `bun run validate` before declaring done.
-
----
-
-## Implementation Summary
-
-### Story Overview
-
-| ID | Title | Priority | Dependencies |
-|----|-------|----------|--------------|
-| US-001 | Layer 2 embedding dedup blocks overlapping critic specs | 1 | — |
-| US-002 | Layer 3 13-week cap with operator soft override | 2 | US-001 |
-| US-003 | Layer 4 archive idle spawned critics | 3 | US-001, US-002 |
-
-### Dependency Graph
-
-```text
-US-001 (dedup guard before registration)
-    ↓
-US-002 (rolling 13-week cap + soft override)
-    ↓
-US-003 (archive-on-idle pruning)
-```
-
----
-
-## Validation Requirements
-
-Every story must pass:
-
-- [ ] Type-check: `bun run type-check`
-- [ ] Lint: `bun run lint --max-warnings 0`
-- [ ] Tests: `bun run test`
-- [ ] Format: `bun run format:check`
-- [ ] Full project gate: `bun run validate`
-
----
-
-Generated: 2026-04-24T00:00:00.000Z
diff --git a/.forge/ralph/genealogy-gov-v1/progress.txt b/.forge/ralph/genealogy-gov-v1/progress.txt
deleted file mode 100644
index 41625c8..0000000
--- a/.forge/ralph/genealogy-gov-v1/progress.txt
+++ /dev/null
@@ -1,88 +0,0 @@
-## Codebase Patterns
-
-### Archive-on-idle uses explicit decision owners
-- **Where**: `scripts/critic-genealogy.ts`
-- **Pattern**: Treat `history/<week>/genealogy/spec.json` as spawn provenance and `history/<week>/decision.json:selected_issues[].owner` as promoted-finding evidence; move agent specs with `renameSync` to preserve bytes.
-- **Example**: `archiveIdleSpawnedCritics(agentsDir, historyRoot, weekDate)` runs before `loadExistingCritics()` in `main()`.
-
-### Governance helpers stay pure and injectable
-- **Where**: `scripts/critic-genealogy.ts`
-- **Pattern**: Put governance decisions in exported pure helpers and inject data providers, then call the helper in `main()` immediately before the side-effecting API boundary.
-- **Example**: `evaluateCriticDedup(candidate, critics, embed)` runs before `registerAgent()` and is tested with deterministic vectors.
-
----
-
-## 2026-04-24T00:00:00.000Z — US-001: Layer 2 embedding dedup blocks overlapping critic specs
-
-**Status**: PASSED
-**Files changed**:
-- `scripts/critic-genealogy.ts` — added cosine-similarity dedup helper over candidate/existing critic scope and description, governance rejection output, and pre-registration gate.
-- `scripts/__tests__/critic-genealogy.test.ts` — added no-network unit coverage for below-threshold allow, exact 0.60 reject, and above-threshold reject behavior.
-- `.forge/ralph/genealogy-gov-v1/prd.md` — fixed markdownlint MD036 formatting so `bun run validate` can pass.
-- `.forge/ralph/genealogy-gov-v1/prd.json` — marked US-001 complete.
-
-**Acceptance criteria verified**:
-- [x] Add an orchestrator-side dedup helper in `scripts/critic-genealogy.ts` that compares a candidate `NewCriticSpec` against active `CriticSummary` entries using embedding cosine similarity over scope and description text.
-- [x] Reject candidate specs with cosine similarity >= 0.60 to any active critic before `registerAgent()` performs `POST /v1/agents`.
-- [x] Governance rejection prints the closest existing critic name, similarity score, and candidate scope without registering an agent or creating a session.
-- [x] Dry-run mode still runs and reports the dedup decision before printing a would-register spec.
-- [x] Unit tests cover below-threshold allow, exactly-0.60 reject, and above-threshold reject behavior without live Anthropic network calls.
-- [x] Type-check passes.
-- [x] Tests pass.
-- [x] `bun run validate` passes.
-
-**Learnings**:
-- `bun run validate` includes markdownlint over `.forge/ralph/**/*.md`; generated PRD footer emphasis triggered MD036 and had to be normalized.
-- The local package has no `cli` script, so Ralph workflow event emissions fail harmlessly with `Script not found "cli"` under the required `|| true` guard.
-
----
-## 2026-04-24T08:29:55.000Z — US-002: Layer 3 13-week cap with operator soft override
-
-**Status**: PASSED
-**Files changed**:
-- `scripts/critic-genealogy.ts` — added `--override-quarterly-cap`, rolling 13-week genealogy spawn counting, malformed in-window spec validation, and pre-registration cap gate.
-- `scripts/__tests__/critic-genealogy.test.ts` — added no-network unit coverage for count 0, count 2 allow, count 3 block, count 3 override allow, exactly-13-week boundary inclusion, and malformed in-window genealogy spec failure.
-- `.forge/ralph/genealogy-gov-v1/prd.json` — marked US-002 complete.
-
-**Acceptance criteria verified**:
-- [x] Add a CLI soft-override flag, named `--override-quarterly-cap` or equivalent, to `parseArgs()` and `CLIArgs` in `scripts/critic-genealogy.ts`.
-- [x] Count spawned critic specs from `history/<YYYY-MM-DD>/genealogy/spec.json` in the rolling 13-week window ending at `args.weekDate`.
-- [x] Block registration when the count is already 3 or more and the override flag is false.
-- [x] Allow registration when the count is 3 or more only if the override flag is true, and print an explicit operator override message.
-- [x] Ignore malformed or missing non-genealogy history directories only when they are irrelevant; malformed in-window genealogy spec data fails loudly with an actionable error.
-- [x] Unit tests cover count 0, count 2 allow, count 3 block, count 3 with override allow, and boundary dates at exactly 13 weeks.
-- [x] Type-check passes.
-- [x] Tests pass.
-- [x] `bun run validate` passes.
-
-**Learnings**:
-- The registration choke point now has two pure governance gates before API side effects: dedup first, then quarterly cap before `registerAgent()` and `createSession()`.
-- Treat the 13-week boundary as inclusive: a spawn exactly 91 days before `args.weekDate` counts toward the cap.
-- Non-date history directories can be ignored; in-window `genealogy/spec.json` files must parse as agent-like JSON so broken genealogy artifacts fail loudly.
-
----
-## 2026-04-24T09:15:00.000Z — US-003: Layer 4 archive idle spawned critics
-
-**Status**: PASSED
-**Files changed**:
-- `scripts/critic-genealogy.ts` — added genealogy-spawn provenance loading, promoted-finding owner parsing from decision history, archive-on-idle moves to `agents/archive/`, and startup pruning before active critic loading.
-- `scripts/__tests__/critic-genealogy.test.ts` — added unit coverage for idle spawned critic archival, active spawned critic retention, original critic retention, archived critic exclusion from active summaries, promoted owner parsing, and spawned provenance loading.
-- `.forge/ralph/genealogy-gov-v1/prd.json` — marked US-003 complete.
-
-**Acceptance criteria verified**:
-- [x] Add archive-on-idle logic in `scripts/critic-genealogy.ts` that evaluates spawned critics and moves idle specs from `agents/<name>.json` to `agents/archive/<name>.json`.
-- [x] A spawned critic is archived only when it has 0 findings promoted across the last 8 weeks; critics with at least 1 promoted finding in that window remain active.
-- [x] Original committed baseline critics are not archived by the idle rule unless history proves they were genealogy-spawned.
-- [x] `loadExistingCritics()` continues to load only active `agents/*-critic.json` files and excludes `agents/archive/*.json` by path.
-- [x] Archive actions create `agents/archive/` if missing and preserve the JSON spec byte-for-byte, except for any reformatting required by existing JSON write conventions.
-- [x] Unit tests cover idle spawned critic archived, active spawned critic retained, original critic retained, and archived critic excluded from active critic summaries.
-- [x] Type-check passes.
-- [x] Tests pass.
-- [x] `bun run validate` passes.
-
-**Learnings**:
-- Spawned-critic provenance should come from `history/<week>/genealogy/spec.json`, not from current agent names alone, so baseline critics are safe by default.
-- Promoted-finding evidence is explicit in `decision.json:selected_issues[].owner`; missing decision files mean no promoted findings for that week, while malformed present decision files fail loudly.
-- `renameSync` preserves archived agent JSON bytes and avoids rewriting specs during governance pruning.
-
----
diff --git a/.forge/ralph/orch-memory-planner-v1/prd.json b/.forge/ralph/orch-memory-planner-v1/prd.json
deleted file mode 100644
index 74f15e8..0000000
--- a/.forge/ralph/orch-memory-planner-v1/prd.json
+++ /dev/null
@@ -1,72 +0,0 @@
-{
-  "project": "Webster",
-  "branchName": "feat/orch-memory-planner-v1",
-  "prdFile": "prd.md",
-  "description": "Add the orchestrator step that marshals memory + verdict + monitor context, invokes webster-planner via the Managed Agents flow, parses the JSON response, writes history/<week>/plan.md, and appends a verdict-ready event to history/memory.jsonl.",
-  "userStories": [
-    {
-      "id": "US-001",
-      "title": "Memory marshaling helper",
-      "description": "As a Webster operator, I want a pure TypeScript helper that reads memory.jsonl tail plus recent verdicts plus the monitor anomaly report and returns a single concatenated user.message text so that the planner always receives the same shape of context.",
-      "acceptanceCriteria": [
-        "Add scripts/planner-context.ts exporting marshalPlannerContext(opts: { memoryPath: string; verdictDir: string; monitorPath: string; tailN?: number }): string.",
-        "The function uses the feature #51 tailN helper from src/memory (or scripts/memory) to read the last N=50 events from memoryPath; it does not re-implement tail logic.",
-        "The function reads the two most recent history/<week>/verdict.json files under verdictDir sorted by week slug descending; missing verdict files are skipped without throwing.",
-        "The function reads the monitor anomaly report text file at monitorPath; a missing monitor file is skipped without throwing.",
-        "The returned string begins with a MEMORY_TAIL section, then a RECENT_VERDICTS section, then a MONITOR_ANOMALIES section, each delimited by a stable header the test file can match.",
-        "When all three inputs are empty or missing, the function returns a string that explicitly labels the cold-start state rather than an empty string.",
-        "Add a Bun test under scripts/__tests__/planner-context.test.ts with fixtures under tmp paths verifying: tailN wiring, two-verdict ordering, missing-file skips, and cold-start labeling.",
-        "bun run type-check, bun run lint --max-warnings 0, bun test, bun run format:check pass."
-      ],
-      "technicalNotes": "Follow the style in scripts/critic-genealogy.ts and scripts/memory.ts (or src/memory). Use readFileSync + path.join; do not use async file APIs unless the existing modules already do. Keep the function free of network I/O. Reuse the feature #51 export rather than re-reading JSONL lines directly.",
-      "dependsOn": [],
-      "priority": 1,
-      "passes": true,
-      "notes": "Implemented in iteration 1. Files: scripts/planner-context.ts, scripts/__tests__/planner-context.test.ts."
-    },
-    {
-      "id": "US-002",
-      "title": "Planner invocation + plan writer",
-      "description": "As a Webster operator, I want a helper that invokes the webster-planner Managed Agent using the marshaled context, parses the structured response, writes history/<week>/plan.md, and appends a verdict-ready row to history/memory.jsonl so that downstream critics can consume the plan.",
-      "acceptanceCriteria": [
-        "Add scripts/planner-invoke.ts exporting invokePlanner(opts: { contextText: string; week: string; historyDir: string; apiKey: string }): Promise<{ planPath: string; plan: PlanRecord }>.",
-        "The function looks up or registers the webster-planner agent via POST /v1/agents, mirroring the find-or-register pattern in scripts/critic-genealogy.ts:440-556.",
-        "The function creates a session via POST /v1/sessions, sends contextText as the user.message event, and polls until the session is idle.",
-        "The function extracts the final assistant text and parses it as JSON with fields classification, next_action, direction_hint, optional new_critic_request, and rationale; next_action must be one of promote_and_experiment, hold_baseline, revert_and_retry, explore_broadly.",
-        "The function writes history/<week>/plan.md as human-readable markdown that embeds the parsed JSON in a fenced code block and prints the parsed fields as a bulleted summary above the fence.",
-        "The function appends one event row to history/memory.jsonl with event = 'verdict-ready' using the feature #51 appendEvent helper and includes refs.plan = relative path to the written plan.md.",
-        "Invalid JSON, missing required fields, or unknown next_action values raise an Error with a descriptive message and do NOT write plan.md or append to memory.jsonl.",
-        "Add a Bun test under scripts/__tests__/planner-invoke.test.ts that mocks fetch (global.fetch or bun:test mock) to exercise: happy path with a valid JSON response, malformed response rejection, and the memory.jsonl append side effect.",
-        "bun run type-check, bun run lint --max-warnings 0, bun test, bun run format:check pass."
-      ],
-      "technicalNotes": "Reuse helper names / patterns from scripts/critic-genealogy.ts (registerAgent, createSession, sendUserMessage, pollUntilIdle) rather than duplicating low-level fetch code. Keep the HTTP base URL configurable via env (ANTHROPIC_API_BASE defaulting to https://api.anthropic.com). Import appendEvent from the same module feature #51 added. Do NOT edit agents/webster-planner.json (owned by feature #50) and do NOT edit prompts/second-wbs-session.md in this story (US-003 owns that).",
-      "dependsOn": [
-        "US-001"
-      ],
-      "priority": 2,
-      "passes": true,
-      "notes": "Implemented in iteration 2. Files: scripts/planner-invoke.ts, scripts/__tests__/planner-invoke.test.ts."
-    },
-    {
-      "id": "US-003",
-      "title": "Orchestrator step in prompts/second-wbs-session.md",
-      "description": "As a Webster operator, I want a new orchestration step in prompts/second-wbs-session.md that runs BEFORE critic fan-out and calls the US-002 helper with US-001 inputs so that the planner's plan.md is ready for critics to read.",
-      "acceptanceCriteria": [
-        "Edit prompts/second-wbs-session.md to add a new numbered step titled 'Run planner' placed BEFORE the critic fan-out step.",
-        "The step shows the bash/bun invocation that marshals context via scripts/planner-context.ts and invokes the planner via scripts/planner-invoke.ts, with the week argument set to the current ISO week folder name under history/.",
-        "The step specifies that on planner error the run halts with a non-zero exit status and a pointer to the error message.",
-        "The step references history/<week>/plan.md as the output artifact consumed by later steps.",
-        "Update README.md or an adjacent doc section if the prior council flow explicitly enumerated the steps, so the step count remains accurate.",
-        "bun run validate passes."
-      ],
-      "technicalNotes": "Edit prompts/second-wbs-session.md only \u2014 do not change orchestrator-owned I/O in the helpers. The step should read like the existing numbered steps: plain bash with comments and exit-on-error semantics. Do not implement runtime invocation of critics from this file; that remains in the later fan-out step.",
-      "dependsOn": [
-        "US-001",
-        "US-002"
-      ],
-      "priority": 3,
-      "passes": true,
-      "notes": "Implemented in iteration 3. Files: prompts/second-wbs-session.md, README.md."
-    }
-  ]
-}
diff --git a/.forge/ralph/orch-memory-planner-v1/prd.md b/.forge/ralph/orch-memory-planner-v1/prd.md
deleted file mode 100644
index d50e0c7..0000000
--- a/.forge/ralph/orch-memory-planner-v1/prd.md
+++ /dev/null
@@ -1,65 +0,0 @@
-# Orchestrator Memory Marshaling + Planner Invocation (L11 #52)
-
-## Problem
-
-Webster's council flow fans out critics + redesigner, but week-over-week
-learning currently has no explicit planner step. Feature #50 ships the
-`webster-planner` Managed Agent spec. Feature #51 ships the
-`history/memory.jsonl` event substrate + `appendEvent` / `tailN` helpers.
-This feature wires the two together: an orchestrator step that runs BEFORE
-critic fan-out, invokes the planner, writes `plan.md`, and logs the event.
-
-Per ADR-0001 the orchestrator owns all JSONL I/O. The planner agent never
-touches disk — it receives marshaled context as `user.message` text and
-returns structured output the orchestrator parses.
-
-## Scope
-
-- Add a TypeScript helper module that marshals the planner's input context.
-- Add a TypeScript helper module that invokes the planner via the
-  Anthropic Managed Agents flow and writes the decoded `plan.md`.
-- Add a new orchestration step to `prompts/second-wbs-session.md` that
-  calls the helpers BEFORE the critic fan-out step.
-
-Out of scope (covered by separate features):
-
-- Plan → critic context wiring (#53).
-- Cold-start explore-broadly defaults (#54) — this feature must not
-  crash when memory tail is empty, but the dedicated cold-start logic is #54.
-- Critic-genealogy invocation of `new_critic_request` (#55).
-
-## Invariants
-
-- Orchestrator-owned I/O. No disk writes from inside the planner agent
-  prompt or tool definitions.
-- Append-only `history/memory.jsonl`. Use the `appendEvent` helper from
-  feature #51. Never mutate prior rows.
-- Zero lint warnings. `bun run validate` must pass.
-- No silent fallbacks. If the planner call fails or returns unparseable
-  output, surface the error — do not fabricate a plan.
-- No API keys in committed code. Load from environment.
-
-## Stories
-
-### US-001 — Memory marshaling helper
-
-Add `scripts/planner-context.ts` exporting a pure function that reads the
-last N memory events plus recent verdict files plus the monitor anomaly
-report and returns a single concatenated text payload suitable for the
-planner's `user.message`.
-
-### US-002 — Planner invocation + plan writer
-
-Add `scripts/planner-invoke.ts` exporting a function that registers the
-`webster-planner` agent (idempotent lookup), creates a session, sends the
-marshaled user message, polls until idle, parses the planner's JSON
-response, writes `history/<week>/plan.md`, and appends a `verdict-ready`
-row to `history/memory.jsonl` via the feature #51 helper.
-
-### US-003 — Orchestrator integration step
-
-Edit `prompts/second-wbs-session.md` to add a new numbered step that runs
-BEFORE the critic fan-out step. The step invokes the helper from US-002
-using the marshaled context from US-001, writes `plan.md` into the current
-week's `history/<week>/` directory, and halts the run if the planner call
-returns an error.
diff --git a/.forge/ralph/orch-memory-planner-v1/progress.txt b/.forge/ralph/orch-memory-planner-v1/progress.txt
deleted file mode 100644
index 09c3091..0000000
--- a/.forge/ralph/orch-memory-planner-v1/progress.txt
+++ /dev/null
@@ -1,81 +0,0 @@
-## Codebase Patterns
-
-### Planner invocation fails closed before disk writes
-- **Where**: `scripts/planner-invoke.ts`
-- **Pattern**: Parse and validate the final assistant JSON before creating `history/<week>/plan.md` or appending to `history/memory.jsonl`; failed planner output leaves no partial plan artifact.
-- **Example**: `const plan = parsePlanRecord(extractFinalAssistantText(snapshot));`
-
-### Orchestrator memory helpers import the substrate directly
-- **Where**: `scripts/planner-context.ts`
-- **Pattern**: Higher-level orchestrator helpers should import `tailN` from `scripts/memory.ts` instead of re-reading JSONL lines.
-- **Example**: `const memoryEvents = readMemoryTail(opts.tailN ?? DEFAULT_TAIL_N, opts.memoryPath);`
-
----
-
-## 2026-04-24 — US-001: Memory marshaling helper
-
-**Status**: PASSED
-**Files changed**:
-- `scripts/planner-context.ts` — added `marshalPlannerContext` with memory tail, recent verdict, monitor anomaly, and cold-start sections.
-- `scripts/__tests__/planner-context.test.ts` — added Bun coverage for tailN wiring, verdict ordering, missing-file skips, and cold-start labeling.
-
-**Acceptance criteria verified**:
-- [x] Add scripts/planner-context.ts exporting marshalPlannerContext(opts: { memoryPath: string; verdictDir: string; monitorPath: string; tailN?: number }): string.
-- [x] The function uses the feature #51 tailN helper from src/memory (or scripts/memory) to read the last N=50 events from memoryPath; it does not re-implement tail logic.
-- [x] The function reads the two most recent history/<week>/verdict.json files under verdictDir sorted by week slug descending; missing verdict files are skipped without throwing.
-- [x] The function reads the monitor anomaly report text file at monitorPath; a missing monitor file is skipped without throwing.
-- [x] The returned string begins with a MEMORY_TAIL section, then a RECENT_VERDICTS section, then a MONITOR_ANOMALIES section, each delimited by a stable header the test file can match.
-- [x] When all three inputs are empty or missing, the function returns a string that explicitly labels the cold-start state rather than an empty string.
-- [x] Add a Bun test under scripts/__tests__/planner-context.test.ts with fixtures under tmp paths verifying: tailN wiring, two-verdict ordering, missing-file skips, and cold-start labeling.
-- [x] bun run type-check, bun run lint --max-warnings 0, bun test, bun run format:check pass.
-
-**Learnings**:
-- `scripts/memory.ts` exposes `tailN(n, logPath)`, so callers pass the count first and the memory path second.
-- No prior `progress.txt` existed for this PRD directory, so this iteration created it with the reusable pattern section.
-
----
-
-## 2026-04-24 — US-002: Planner invocation + plan writer
-
-**Status**: PASSED
-**Files changed**:
-- `scripts/planner-invoke.ts` — added `invokePlanner` with Managed Agent lookup/registration, session creation, context message send, idle polling, strict plan JSON parsing, plan markdown writing, and `verdict-ready` memory append.
-- `scripts/__tests__/planner-invoke.test.ts` — added Bun fetch-mock coverage for a valid planner response, malformed JSON rejection, unknown `next_action` rejection, and memory append side effects.
-
-**Acceptance criteria verified**:
-- [x] Add scripts/planner-invoke.ts exporting invokePlanner(opts: { contextText: string; week: string; historyDir: string; apiKey: string }): Promise<{ planPath: string; plan: PlanRecord }>.
-- [x] The function looks up or registers the webster-planner agent via POST /v1/agents, mirroring the find-or-register pattern in scripts/critic-genealogy.ts:440-556.
-- [x] The function creates a session via POST /v1/sessions, sends contextText as the user.message event, and polls until the session is idle.
-- [x] The function extracts the final assistant text and parses it as JSON with fields classification, next_action, direction_hint, optional new_critic_request, and rationale; next_action must be one of promote_and_experiment, hold_baseline, revert_and_retry, explore_broadly.
-- [x] The function writes history/<week>/plan.md as human-readable markdown that embeds the parsed JSON in a fenced code block and prints the parsed fields as a bulleted summary above the fence.
-- [x] The function appends one event row to history/memory.jsonl with event = 'verdict-ready' using the feature #51 appendEvent helper and includes refs.plan = relative path to the written plan.md.
-- [x] Invalid JSON, missing required fields, or unknown next_action values raise an Error with a descriptive message and do NOT write plan.md or append to memory.jsonl.
-- [x] Add a Bun test under scripts/__tests__/planner-invoke.test.ts that mocks fetch (global.fetch or bun:test mock) to exercise: happy path with a valid JSON response, malformed response rejection, and the memory.jsonl append side effect.
-- [x] bun run type-check, bun run lint --max-warnings 0, bun test, bun run format:check pass.
-
-**Learnings**:
-- `environments/webster-council-env.id` is available in this worktree, so planner session creation can mirror genealogy sessions by passing `environment_id` without expanding the public `invokePlanner` options.
-- `agents/webster-planner.json` is absent in this branch even though feature #50 is marked landed elsewhere; the helper supports registration when the spec exists and reuses an already-registered planner without reading the missing file.
-- `bun run cli` is not defined in this repo, so Ralph workflow event emissions failed harmlessly under the required `|| true` wrapper.
-
----
-## 2026-04-24 — US-003: Orchestrator step in prompts/second-wbs-session.md
-
-**Status**: PASSED
-**Files changed**:
-- `prompts/second-wbs-session.md` — added fail-closed Step 3 planner orchestration before critic fan-out, marshaling context through `scripts/planner-context.ts`, invoking `scripts/planner-invoke.ts`, committing `history/<week>/plan.md` + `history/memory.jsonl`, and passing `PLAN_PATH` to downstream agents.
-- `README.md` — updated architecture diagram, weekly-flow step count, runtime estimate, and weekly-run summary to include the planner step.
-
-**Acceptance criteria verified**:
-- [x] Edit prompts/second-wbs-session.md to add a new numbered step titled 'Run planner' placed BEFORE the critic fan-out step.
-- [x] The step shows the bash/bun invocation that marshals context via scripts/planner-context.ts and invokes the planner via scripts/planner-invoke.ts, with the week argument set to the current ISO week folder name under history/.
-- [x] The step specifies that on planner error the run halts with a non-zero exit status and a pointer to the error message.
-- [x] The step references history/<week>/plan.md as the output artifact consumed by later steps.
-- [x] Update README.md or an adjacent doc section if the prior council flow explicitly enumerated the steps, so the step count remains accurate.
-- [x] bun run validate passes.
-
-**Learnings**:
-- The weekly runner uses `WEEK_DATE=$(date -u +%Y-%m-%d)` as its history folder slug, so the planner step reuses that existing ISO-8601 UTC folder naming pattern instead of introducing a second week format.
-- `bun --eval` receives user arguments at `process.argv.slice(1)`, which keeps the prompt-only invocation small without adding CLI code to the helper modules.
-
----
diff --git a/.forge/ralph/planner-agent-spec-v5/prd.json b/.forge/ralph/planner-agent-spec-v5/prd.json
deleted file mode 100644
index 4328b68..0000000
--- a/.forge/ralph/planner-agent-spec-v5/prd.json
+++ /dev/null
@@ -1,69 +0,0 @@
-{
-  "project": "Webster",
-  "branchName": "ralph/planner-agent-spec-v5",
-  "prdFile": "prd.md",
-  "description": "Add a schema-valid Opus 4.7 webster-planner Managed Agent spec and tests for its plan.md contract and registration-flow shape.",
-  "userStories": [
-    {
-      "id": "US-001",
-      "title": "Add schema-valid planner Managed Agent spec",
-      "description": "As a Webster implementation operator, I want agents/webster-planner.json to exist as an Opus 4.7 Managed Agent spec so that later orchestration can register and invoke the planner.",
-      "acceptanceCriteria": [
-        "Create agents/webster-planner.json with name \"webster-planner\", model \"claude-opus-4-7\", and required fields accepted by scripts/schemas/agent.schema.json.",
-        "The spec uses field \"system\" and does not include rejected fields such as \"system_prompt\" or \"callable_agents\".",
-        "The system prompt states that user.message supplies marshaled memory context: memory.jsonl tail, last two weeks verdict context, and monitor anomaly report.",
-        "The system prompt defines the plan.md JSON fields: classification, next_action, direction_hint, optional new_critic_request, and rationale.",
-        "The next_action enum in the system prompt includes exactly promote_and_experiment, hold_baseline, revert_and_retry, and explore_broadly.",
-        "The system prompt instructs cold-start/week-1/no-prior-verdict handling to use explore_broadly.",
-        "Feature #52 and #53 behavior is not implemented in this story.",
-        "bun run validate:agents passes"
-      ],
-      "technicalNotes": "Modify agents/webster-planner.json. Mirror the spec shape in agents/webster-redesigner.json and agents/webster-monitor.json: name, description, model, system, tools, optional mcp_servers, metadata. Follow scripts/schemas/agent.schema.json constraints: required name/description/model/system/tools, no additional properties, model enum includes claude-opus-4-7, metadata.role must be one of critic/monitor/redesigner/orchestrator. Use metadata { role: \"orchestrator\", scope: \"planning\" } because the schema does not currently allow role \"planner\". Scope guard: do not edit prompts/second-wbs-session.md, scripts/memory.ts, or council fan-out code for runtime invocation.",
-      "dependsOn": [],
-      "priority": 1,
-      "passes": true,
-      "notes": "Implemented in iteration 1. Files: agents/webster-planner.json, .forge/ralph/planner-agent-spec-v5/prd.md."
-    },
-    {
-      "id": "US-002",
-      "title": "Add planner output contract tests",
-      "description": "As a Webster implementation operator, I want tests for the planner's plan.md contract so that future orchestration can rely on stable fields and action values.",
-      "acceptanceCriteria": [
-        "Add a Bun test that reads agents/webster-planner.json and asserts its system prompt contains all required output fields: classification, next_action, direction_hint, new_critic_request, and rationale.",
-        "Add a Bun test that asserts the planner system prompt contains all four allowed next_action values: promote_and_experiment, hold_baseline, revert_and_retry, explore_broadly.",
-        "Add a Bun test that asserts the planner system prompt describes cold-start behavior for week 1/no prior verdict and ties it to explore_broadly.",
-        "Add a Bun test that asserts the planner system prompt names all three input context sources: memory.jsonl, verdict, and monitor anomaly report or alerts.",
-        "Tests fail if agents/webster-planner.json is missing or invalid JSON.",
-        "bun test passes"
-      ],
-      "technicalNotes": "Add tests under scripts/__tests__ using the existing Bun style in scripts/__tests__/validate-agents.test.ts and scripts/__tests__/critic-genealogy.test.ts: import { describe, expect, test } from \"bun:test\", read JSON with readFileSync, and resolve ROOT via import.meta.dir. Keep tests focused on the agent spec contract; do not create runtime planner invocation helpers because feature #52 owns invocation.",
-      "dependsOn": [
-        "US-001"
-      ],
-      "priority": 2,
-      "passes": true,
-      "notes": "Implemented in iteration 2. Files: scripts/__tests__/planner-agent-contract.test.ts."
-    },
-    {
-      "id": "US-003",
-      "title": "Add registration-flow guard tests and validate",
-      "description": "As a Webster implementation operator, I want tests that guard the Managed Agents registration shape so that the planner can be posted to /v1/agents and invoked through the existing session pattern later.",
-      "acceptanceCriteria": [
-        "Add or extend a test to validate agents/webster-planner.json against scripts/schemas/agent.schema.json with AJV 2020, matching scripts/__tests__/validate-agents.test.ts patterns.",
-        "Add a test that asserts the planner spec has registration-compatible top-level fields only and no research-preview callable_agents field.",
-        "Add a test or assertion that the planner spec includes tools with type agent_toolset_20260401, matching the Managed Agents beta pattern in existing agent specs.",
-        "Add a test assertion or technical note in the test name referencing the existing registration/session flow in scripts/critic-genealogy.ts: find/register agent, create session, send user.message, poll until idle.",
-        "Run bun run format:check, bun run type-check, bun run lint --max-warnings 0, bun run validate:agents, bun test, and bun run validate before declaring completion.",
-        "Do not implement scripts that call /v1/sessions or write history/<week>/plan.md; that remains feature #52."
-      ],
-      "technicalNotes": "Use the same AJV setup as scripts/__tests__/validate-agents.test.ts: Ajv2020 from ajv/dist/2020.js plus addFormats.default(ajv). Registration flow references should be grounded in scripts/critic-genealogy.ts:440-556, where registerAgent POSTs to /v1/agents, createSession POSTs to /v1/sessions, sendUserMessage POSTs to /sessions/{id}/events, and pollUntilIdle reads /sessions/{id}. This story should only test that the planner spec is compatible with that flow, not duplicate or export those helpers.",
-      "dependsOn": [
-        "US-001",
-        "US-002"
-      ],
-      "priority": 3,
-      "passes": true,
-      "notes": "Implemented in iteration 3. Files: scripts/__tests__/planner-agent-contract.test.ts."
-    }
-  ]
-}
diff --git a/.forge/ralph/planner-agent-spec-v5/prd.md b/.forge/ralph/planner-agent-spec-v5/prd.md
deleted file mode 100644
index 9ae0459..0000000
--- a/.forge/ralph/planner-agent-spec-v5/prd.md
+++ /dev/null
@@ -1,151 +0,0 @@
-# Planner Agent Spec — Product Requirements
-
-## Overview
-
-**Problem**: Webster's weekly council can critique and redesign, but Layer 11 needs an experiment-aware planning brain before the critics run. Without a schema-valid `webster-planner` Managed Agent spec, later orchestration work (#52) has no registered agent to invoke and no stable `plan.md` contract to hand to critics (#53).
-**Solution**: Add `agents/webster-planner.json` as an Opus 4.7 Managed Agent spec that matches the existing Managed Agents beta schema, reads marshaled memory context supplied by the orchestrator, and emits a `plan.md` containing a strict JSON object with `classification`, `next_action`, `direction_hint`, optional `new_critic_request`, and `rationale`.
-**Branch**: `ralph/planner-agent-spec-v5`
-
----
-
-## Goals & Success
-
-### Primary Goal
-
-Ship the planner agent spec and tests that prove it is schema-valid and aligned with Webster's registration/invocation pattern, without implementing the later orchestrator memory marshaling or council integration features.
-
-### Success Metrics
-
-| Metric | Target | How Measured |
-|--------|--------|--------------|
-| Managed Agent schema validity | `agents/webster-planner.json` passes the committed schema | `bun run validate:agents` and `bun test` |
-| Planner output contract coverage | Tests verify required `plan.md` JSON fields and `next_action` enum values | New/updated Bun tests |
-| Registration-flow alignment | Tests assert planner uses `POST /v1/agents`-compatible fields and no research-preview fields | New/updated Bun tests referencing existing schema and critic-genealogy flow |
-| Scope containment | No orchestrator prompt, memory helper, or council fan-out implementation changes | Git diff review |
-
-### Non-Goals (Out of Scope)
-
-- Implementing orchestrator memory marshaling or planner invocation — explicitly owned by feature #52.
-- Passing `plan.md` into critics/redesigner or spawning genealogy from planner output — explicitly owned by feature #53.
-- Building cold-start orchestration behavior beyond planner spec instructions — feature #54 owns runtime cold-start plumbing.
-- Changing the Managed Agent schema shape unless strictly required for the new `orchestrator` metadata role already allowed by `scripts/schemas/agent.schema.json`.
-
----
-
-## User & Context
-
-### Target User
-
-- **Who**: Webster implementation operators preparing the Layer 11 planner + experiment-aware council.
-- **Role**: They maintain Managed Agent specs, validation gates, and orchestration scripts for the hackathon submission.
-- **Current Pain**: Later features cannot safely invoke a planner because there is no registered-agent spec or tested `plan.md` output contract.
-
-### User Journey
-
-1. **Trigger**: Operator picks feature #50 from `context/FEATURES.md` and needs a schema-valid planner agent spec.
-2. **Action**: Operator adds `agents/webster-planner.json`, runs validation/tests, and confirms it follows the beta Managed Agents registration shape.
-3. **Outcome**: Feature #52 can register/invoke this planner via `/v1/agents`, `/v1/sessions`, events, and polling, then persist the returned `plan.md`.
-
----
-
-## UX Requirements
-
-### Interaction Model
-
-Backend/spec-only. Users do not interact with UI. The planner is registered through the same Managed Agents beta API shape used by existing specs and later invoked by orchestration code using the five-step pattern visible in `scripts/critic-genealogy.ts:440-556`: find/register agent, create session, send `user.message`, poll session status, inspect output.
-
-### States to Handle
-
-| State | Description | Behavior |
-|-------|-------------|----------|
-| Empty | Memory tail and prior verdicts are absent in week 1 | Planner instructions must direct the planner to choose `next_action: "explore_broadly"` and explain the cold-start classification. |
-| Loading | Runtime session is polling after a planner `user.message` | Out of scope for #50; covered by existing pattern in `scripts/critic-genealogy.ts:503-556` and future #52. |
-| Error | Marshaled memory is contradictory, malformed, or missing key sections | Planner instructions must require the planner to still emit valid `plan.md` JSON and state its uncertainty in `rationale`. |
-| Success | Planner has memory tail, verdicts, and monitor anomaly report | Planner emits a single `plan.md` JSON object with an allowed `next_action` and concrete `direction_hint`. |
-
----
-
-## Technical Context
-
-### Patterns to Follow
-
-- **Managed Agent spec pattern**: `agents/webster-redesigner.json` — Opus 4.7 agent with `name`, `description`, `model`, long `system`, `tools`, `mcp_servers`, and `metadata`.
-- **Monitor context pattern**: `agents/webster-monitor.json` — reads analytics inputs, handles missing prior week, and writes structured output without proposing fixes.
-- **Registration + session pattern**: `scripts/critic-genealogy.ts:440-556` — `findAgentByName`, `registerAgent`, `createSession`, `sendUserMessage`, and `pollUntilIdle` use `/v1/agents`, `/v1/sessions`, `/events`, and polling with `managed-agents-2026-04-01` beta headers.
-- **Schema validation pattern**: `scripts/schemas/agent.schema.json` — requires `name`, `description`, `model`, `system`, and `tools`; rejects `system_prompt`, `callable_agents`, and unknown models.
-- **Agent validation tests**: `scripts/__tests__/validate-agents.test.ts` — compiles the schema with AJV 2020 and validates every `agents/*.json` file.
-- **Registration gotcha tests**: `scripts/__tests__/critic-genealogy.test.ts` — verifies generated specs preserve tools/MCP servers and remain valid against `agent.schema.json`.
-
-### Types & Interfaces
-
-```typescript
-// Existing schema-level contract from scripts/schemas/agent.schema.json
-type PlannerAgentSpec = {
-  name: string;
-  description: string;
-  model: "claude-opus-4-7" | "claude-opus-4-7-20260101";
-  system: string;
-  tools: Array<{ type: "agent_toolset_20260401" } | { type: "mcp_toolset"; mcp_server_name: string }>;
-  mcp_servers?: Array<{ type: "url"; name: string; url: string }>;
-  metadata?: { role?: "orchestrator"; scope?: string };
-};
-
-type PlannerPlan = {
-  classification: string;
-  next_action: "promote_and_experiment" | "hold_baseline" | "revert_and_retry" | "explore_broadly";
-  direction_hint: string;
-  new_critic_request?: {
-    scope: string;
-    rationale: string;
-    evidence_refs: string[];
-  };
-  rationale: string;
-};
-```
-
-### Architecture Notes
-
-- The planner is an Opus 4.7 Managed Agent per Q1 ADR-0001 and `context/FEATURES.md` feature #50.
-- The agent must not read repository files itself for memory; #50's spec should state that the orchestrator supplies marshaled `memory.jsonl` tail, last two weeks of verdicts, and monitor anomaly report in `user.message`.
-- The planner output contract is `plan.md` whose body contains one JSON object; tests can assert the system prompt includes the required schema fields and enum values.
-- The spec should reuse the GitHub MCP toolset pattern from `webster-redesigner`/`webster-monitor` only if the planner is instructed to commit `plan.md` itself. Feature #52 says the orchestrator extracts output and writes `history/<week>/plan.md`, so the planner spec can be agent-toolset-only unless existing Managed Agent registration expectations require MCP parity.
-- Metadata should use `role: "orchestrator"` and `scope: "planning"` because `scripts/schemas/agent.schema.json` already allows `orchestrator` but not `planner`.
-
----
-
-## Implementation Summary
-
-### Story Overview
-
-| ID | Title | Priority | Dependencies |
-|----|-------|----------|--------------|
-| US-001 | Add schema-valid planner Managed Agent spec | 1 | — |
-| US-002 | Add planner output contract tests | 2 | US-001 |
-| US-003 | Add registration-flow guard tests and validate | 3 | US-001, US-002 |
-
-### Dependency Graph
-
-```text
-US-001 (agent spec)
-    ↓
-US-002 (plan.md output contract tests)
-    ↓
-US-003 (registration-flow guard tests + validation)
-```
-
----
-
-## Validation Requirements
-
-Every story must pass:
-
-- [ ] Type-check: `bun run type-check`
-- [ ] Lint: `bun run lint --max-warnings 0`
-- [ ] Tests: `bun run test`
-- [ ] Format: `bun run format:check`
-- [ ] Agent schema validation: `bun run validate:agents`
-- [ ] Full validation before completion: `bun run validate`
-
----
-
-Generated: 2026-04-24T00:00:00.000Z
diff --git a/.forge/ralph/seed-demo-arc-w3w4-v5/prd.json b/.forge/ralph/seed-demo-arc-w3w4-v5/prd.json
deleted file mode 100644
index 6499e5f..0000000
--- a/.forge/ralph/seed-demo-arc-w3w4-v5/prd.json
+++ /dev/null
@@ -1,49 +0,0 @@
-{
-  "project": "Webster",
-  "branchName": "ralph/seed-demo-arc-w3w4-v5",
-  "prdFile": "prd.md",
-  "description": "Complete feature #57 by extending the existing demo arc seeder from W1/W2 through W3/W4 with 6-of-7 lane coverage and one W4 genealogy spawn.",
-  "userStories": [
-    {
-      "id": "US-003",
-      "title": "Add W3 gate-fail and auto-rollback seeding",
-      "description": "As a Webster demo operator, I want W3 demo-arc artifacts for archive-gate-fail, auto-rollback, and hold outcomes so that the demo can show failure learning without touching live history.",
-      "acceptanceCriteria": [
-        "`bun scripts/seed-demo-arc.ts` writes `history/demo-arc/demo-W3/proposal.md`, `decision.json`, and `verdict.json`.",
-        "W3 verdict includes `exp-05-mid-section-image-swap` with outcome `archive-gate-fail` and a failing `bounce_rate` gate.",
-        "W3 verdict includes `exp-06-cta-color-shift` with outcome `auto-rollback`, classification `hurt`, and `reward_delta_pct` of `-11`.",
-        "W3 verdict includes `exp-07-subhead-rewrite` with outcome `hold` and classification `neutral`.",
-        "`history/demo-arc/baselines.jsonl` records W3 lane statuses as `archived-gate-fail` and `rolled-back`, and records no promoted baseline for the held experiment.",
-        "`history/demo-arc/memory.jsonl` contains W3 rows whose final events reflect archive/rollback/hold behavior rather than labeling every W3 experiment as a promotion.",
-        "Running the seeder twice produces deterministic W3 output under `history/demo-arc/` and does not write outside that directory.",
-        "`bun run validate` passes."
-      ],
-      "technicalNotes": "Build on `scripts/seed-demo-arc.ts` only. Reuse existing W3 entries in `EXPERIMENT_SPECS` at `scripts/seed-demo-arc.ts:240-291`; mirror `writeW1`/`writeW2` at `scripts/seed-demo-arc.ts:459-476` with a `writeW3`. Update shared baseline/memory helpers at `scripts/seed-demo-arc.ts:437-457` if needed so lane-specific statuses/events are represented correctly. Preserve `initDemoArcDir()` isolation under `history/demo-arc/` from `scripts/seed-demo-arc.ts:340-351`. Follow the locked W3 narrative in `context/DOMAIN-MODEL.md:415-420` and feature #57 scope in `context/FEATURES.md:172`.",
-      "dependsOn": [],
-      "priority": 1,
-      "passes": true,
-      "notes": "Implemented in iteration 1. Files: scripts/seed-demo-arc.ts, history/demo-arc/demo-W3/proposal.md, history/demo-arc/demo-W3/decision.json, history/demo-arc/demo-W3/verdict.json, history/demo-arc/baselines.jsonl, history/demo-arc/memory.jsonl."
-    },
-    {
-      "id": "US-004",
-      "title": "Add W4 conservative wins and genealogy spawn",
-      "description": "As a Webster demo operator, I want W4 demo-arc artifacts plus one spawned critic artifact set so that the demo closes the loop from W3 failure to critic genealogy and safe recovery wins.",
-      "acceptanceCriteria": [
-        "`bun scripts/seed-demo-arc.ts` writes `history/demo-arc/demo-W4/proposal.md`, `decision.json`, and `verdict.json`.",
-        "W4 verdict includes `exp-08-hero-safety-copy` and `exp-09-cta-size-adjust` as passing conservative experiments.",
-        "Outcome coverage across W1-W4 includes all six of these lanes: `promote-fast-track`, `promote-fallback`, `promote-gate-win`, `archive-gate-fail`, `auto-rollback`, and `hold`.",
-        "The seeder writes one W4 genealogy-spawned critic spec for a bounce-risk concern under `history/demo-arc/demo-W4/genealogy/`.",
-        "The genealogy artifacts include a `NewCriticSpec`-shaped JSON payload and an `AgentJSON`-shaped critic registration payload using the existing exported interfaces.",
-        "W4 memory rows include a `gap-detected` event or equivalent genealogy trigger referencing the W3 bounce/gate-fail pattern and the spawned critic.",
-        "The script completion message reflects seeding through demo-W4 instead of demo-W2.",
-        "Running the seeder twice produces deterministic W4/genealogy output under `history/demo-arc/` and does not write outside that directory.",
-        "`bun run validate` passes."
-      ],
-      "technicalNotes": "Depends on US-003's lane-correct baseline and memory helper behavior. Reuse existing W4 entries in `EXPERIMENT_SPECS` at `scripts/seed-demo-arc.ts:292-338`; mirror the existing week writer pattern at `scripts/seed-demo-arc.ts:459-476` with `writeW4`. Use the existing `AgentJSON` and `NewCriticSpec` interfaces from `scripts/seed-demo-arc.ts:68-87` for deterministic genealogy JSON files. `initDemoArcDir()` already creates `history/demo-arc/demo-W4/genealogy` at `scripts/seed-demo-arc.ts:348`; write artifacts there. Follow the W4 table row and Git-state expectations in `context/DOMAIN-MODEL.md:421-429`. Do not call real Managed Agent APIs or alter `agents/` live specs.",
-      "dependsOn": ["US-003"],
-      "priority": 2,
-      "passes": true,
-      "notes": "Implemented in iteration 2. Files: scripts/seed-demo-arc.ts, history/demo-arc/demo-W4/proposal.md, history/demo-arc/demo-W4/decision.json, history/demo-arc/demo-W4/verdict.json, history/demo-arc/demo-W4/genealogy/new-critic-spec.json, history/demo-arc/demo-W4/genealogy/agent-registration.json, history/demo-arc/baselines.jsonl, history/demo-arc/memory.jsonl, context/FEATURES.md."
-    }
-  ]
-}
diff --git a/.forge/ralph/seed-demo-arc-w3w4-v5/prd.md b/.forge/ralph/seed-demo-arc-w3w4-v5/prd.md
deleted file mode 100644
index 23f24cd..0000000
--- a/.forge/ralph/seed-demo-arc-w3w4-v5/prd.md
+++ /dev/null
@@ -1,153 +0,0 @@
-# Seed Demo Arc W3/W4 — Product Requirements
-
-## Overview
-
-**Problem**: Feature #57 is only half shipped. `scripts/seed-demo-arc.ts` already seeds W1/W2, but the demo arc still cannot show the dramatic W3 failure/rollback beat or the W4 critic-genealogy response promised in the Webster narrative.
-**Solution**: Extend the existing seeder with the already-modeled W3 and W4 experiment specs, artifact writers, baseline/memory rows, and W4 genealogy artifacts. Do not rework US-001 or US-002.
-**Branch**: `ralph/seed-demo-arc-w3w4-v5`
-
----
-
-## Goals & Success
-
-### Primary Goal
-
-Complete feature #57 by adding only US-003 and US-004 so `bun scripts/seed-demo-arc.ts` creates a complete, idempotent four-week demo arc under `history/demo-arc/`.
-
-### Success Metrics
-
-| Metric | Target | How Measured |
-| ------ | ------ | ------------ |
-| Week coverage | W1, W2, W3, and W4 artifacts exist | Run seeder and inspect `history/demo-arc/demo-W*/` |
-| Outcome coverage | 6 of 7 Q4 lanes represented | Inspect `verdict.json` outcomes across all weeks |
-| Genealogy proof | One W4 spawned critic artifact set exists | Inspect `history/demo-arc/demo-W4/genealogy/` |
-| Runtime safety | No live history mutation | Seeder writes only beneath `history/demo-arc/` |
-| Quality gate | Validation green | `bun run validate` |
-
-### Non-Goals (Out of Scope)
-
-- Re-implementing W1/W2 scaffold or artifact writers — already landed in `fb3256e`.
-- Creating real Managed Agents through the Anthropic API — this is a deterministic mock seeder.
-- Touching live weekly history outside `history/demo-arc/` — demo data must remain isolated.
-- Covering the 7th outcome lane — the locked hero claim is deliberately 6/7.
-
----
-
-## User & Context
-
-### Target User
-
-- **Who**: Webster implementation operator preparing the hackathon demo.
-- **Role**: Maintains deterministic run artifacts that let the council/planner story be replayed.
-- **Current Pain**: The seeded output stops at W2, so the best narrative beats are absent.
-
-### User Journey
-
-1. **Trigger**: Operator needs a four-week mock arc for the submission demo.
-2. **Action**: Operator runs `bun scripts/seed-demo-arc.ts`.
-3. **Outcome**: `history/demo-arc/` contains W1-W4 proposals, decisions, verdicts, memory, baselines, and W4 genealogy artifacts.
-
----
-
-## UX Requirements
-
-### Interaction Model
-
-CLI-only deterministic seed script. The user runs `bun scripts/seed-demo-arc.ts`; the script recreates `history/demo-arc/` from scratch and prints a completion message.
-
-### States to Handle
-
-| State | Description | Behavior |
-| ----- | ----------- | -------- |
-| Empty | `history/demo-arc/` does not exist | Create directory tree and all artifacts |
-| Loading | Script is running | Synchronous file writes; no progress UI required |
-| Error | Filesystem or type errors occur | Let Bun/Node error surface; no silent fallback |
-| Success | Seeder completes | W1-W4 artifacts are present and deterministic |
-
----
-
-## Technical Context
-
-### Patterns to Follow
-
-- **Existing seeder scaffold**: `scripts/seed-demo-arc.ts:12-129` — constants, demo week identifiers, and TypeScript interfaces already define the artifact model.
-- **Existing W3/W4 data**: `scripts/seed-demo-arc.ts:240-338` — W3 and W4 `EXPERIMENT_SPECS` already encode experiment IDs, outcomes, gates, and insights.
-- **Artifact writer pattern**: `scripts/seed-demo-arc.ts:365-435` — proposal, decision, verdict, baseline, and memory writes are pure helper functions.
-- **Existing W1/W2 orchestration**: `scripts/seed-demo-arc.ts:459-479` — `writeW1`, `writeW2`, and `main` show the intended week writer shape.
-- **Locked domain narrative**: `context/DOMAIN-MODEL.md:411-431` — Q9 table defines W3/W4 experiments, outcomes, and genealogy demo beat.
-- **Feature tracking**: `context/FEATURES.md:172` — #57 status and remaining scope are canonical.
-- **Validation rules**: `CLAUDE.md:18-31` and `package.json:scripts.validate` — type-check, lint, format, agent/findings validation, markdownlint, and tests are mandatory.
-
-### Types & Interfaces
-
-```typescript
-type OutcomeLane =
-  | "promote-fast-track"
-  | "promote-fallback"
-  | "promote-gate-win"
-  | "archive-gate-fail"
-  | "auto-rollback"
-  | "hold";
-
-interface ExperimentSpec extends ExperimentVerdict {
-  week: DemoWeek;
-  target_files: string[];
-  proposed_change: string;
-  rationale: string;
-  baseline_sha: string;
-  verdict_ready_insight: string;
-  promote_insight: string;
-}
-
-interface NewCriticSpec {
-  name: string;
-  scope: string;
-  description: string;
-  rationale: string;
-  focus_owned: string[];
-  focus_not_owned: string[];
-  severity_rubric: string;
-}
-```
-
-### Architecture Notes
-
-- `initDemoArcDir()` currently creates all week directories and `demo-W4/genealogy`, so US-003/US-004 should add writers rather than new directory bootstrapping.
-- `buildBaselineRows()` currently marks every row as `promoted`; US-003 must preserve `archived-gate-fail` and `rolled-back` statuses for W3 lanes.
-- `buildWeekMemoryRows()` currently emits `promote` for every final event; US-003 must emit event names matching each outcome where relevant, especially rollback and skip/hold semantics.
-- W4 genealogy should use the existing `AgentJSON` and `NewCriticSpec` shapes and write deterministic local JSON/Markdown artifacts under `history/demo-arc/demo-W4/genealogy/`.
-
----
-
-## Implementation Summary
-
-### Story Overview
-
-| ID | Title | Priority | Dependencies |
-| -- | ----- | -------- | ------------ |
-| US-003 | Add W3 gate-fail and auto-rollback seeding | 1 | -- |
-| US-004 | Add W4 conservative wins and genealogy spawn | 2 | US-003 |
-
-### Dependency Graph
-
-```text
-US-003 (W3 artifact writers + lane-correct baseline/memory rows)
-    ↓
-US-004 (W4 artifact writers + genealogy spawn artifacts)
-```
-
----
-
-## Validation Requirements
-
-Every story must pass:
-
-- [ ] Type-check: `bun run type-check`
-- [ ] Lint: `bun run lint --max-warnings 0`
-- [ ] Tests: `bun run test`
-- [ ] Format: `bun run format:check`
-- [ ] Full validation: `bun run validate`
-
----
-
-Generated: 2026-04-24T07:47:55Z
diff --git a/.forge/ralph/seed-demo-arc-w3w4-v5/progress.txt b/.forge/ralph/seed-demo-arc-w3w4-v5/progress.txt
deleted file mode 100644
index 2318beb..0000000
--- a/.forge/ralph/seed-demo-arc-w3w4-v5/progress.txt
+++ /dev/null
@@ -1,88 +0,0 @@
-## Codebase Patterns
-
-### Deterministic local genealogy artifacts
-- **Where**: `scripts/seed-demo-arc.ts`
-- **Pattern**: Model demo-only critic genealogy with typed constants satisfying `NewCriticSpec` and `AgentJSON`, then write those JSON payloads under the week-local `history/demo-arc/demo-W4/genealogy/` directory. Do not mutate live `agents/` specs or call Managed Agent APIs from the seeder.
-- **Example**: `BOUNCE_GUARD_CRITIC_SPEC satisfies NewCriticSpec` and `BOUNCE_GUARD_AGENT_JSON satisfies AgentJSON`.
-
-### Outcome lane mapping for demo baselines and memory
-- **Where**: `scripts/seed-demo-arc.ts`
-- **Pattern**: Keep experiment specs as the single source of truth, then derive baseline status and final memory event from `experiment.outcome`.
-- **Example**: `archive-gate-fail -> archived-gate-fail + regression`, `auto-rollback -> rolled-back + rollback`, `hold -> no baseline row + skip`.
-
----
-
-## 2026-04-24T07:55:39Z — US-003: Add W3 gate-fail and auto-rollback seeding
-
-**Status**: PASSED
-**Files changed**:
-- `scripts/seed-demo-arc.ts` — added W3 writer and lane-specific baseline/memory helpers.
-- `history/demo-arc/demo-W3/proposal.md` — seeded W3 proposal artifacts.
-- `history/demo-arc/demo-W3/decision.json` — seeded W3 planner decision artifacts.
-- `history/demo-arc/demo-W3/verdict.json` — seeded W3 verdict artifacts.
-- `history/demo-arc/baselines.jsonl` — added W3 archive/rollback rows with no held-experiment promotion.
-- `history/demo-arc/memory.jsonl` — added W3 verdict-ready plus regression/rollback/skip final events.
-- `.forge/ralph/seed-demo-arc-w3w4-v5/prd.md` — removed emphasis from generated footer so repository markdown validation passes.
-
-**Acceptance criteria verified**:
-- [x] `bun scripts/seed-demo-arc.ts` writes `history/demo-arc/demo-W3/proposal.md`, `decision.json`, and `verdict.json`.
-- [x] W3 verdict includes `exp-05-mid-section-image-swap` with outcome `archive-gate-fail` and a failing `bounce_rate` gate.
-- [x] W3 verdict includes `exp-06-cta-color-shift` with outcome `auto-rollback`, classification `hurt`, and `reward_delta_pct` of `-11`.
-- [x] W3 verdict includes `exp-07-subhead-rewrite` with outcome `hold` and classification `neutral`.
-- [x] `history/demo-arc/baselines.jsonl` records W3 lane statuses as `archived-gate-fail`, `rolled-back`, and no promoted baseline for the held experiment.
-- [x] `history/demo-arc/memory.jsonl` contains W3 rows whose final events reflect archive/rollback/hold behavior rather than labeling every W3 experiment as a promotion.
-- [x] Running the seeder twice produces deterministic W3 output under `history/demo-arc/` and does not write outside that directory.
-- [x] `bun run validate` passes.
-
-**Learnings**:
-- `progress.txt` was absent at iteration start, so this iteration created it with a codebase pattern section.
-- The existing W3 specs already contained the required verdict details; implementation only needed orchestration plus derived baseline/memory semantics.
-- `bun run validate` initially failed on the generated PRD footer being emphasis-only markdown; removing the emphasis made markdownlint pass.
-
-**Verification**:
-- `bun scripts/seed-demo-arc.ts && cp -R history/demo-arc /tmp/demo-arc-first && bun scripts/seed-demo-arc.ts && diff -qr /tmp/demo-arc-first history/demo-arc`
-- `jq '.experiments[] | {exp_id,outcome,classification,reward_delta_pct,gates}' history/demo-arc/demo-W3/verdict.json`
-- `grep 'exp-0[567]' history/demo-arc/baselines.jsonl`
-- `grep 'demo-W3' history/demo-arc/memory.jsonl`
-- `bun run type-check && bun run lint --max-warnings 0 && bun run test && bun run format:check && bun run validate`
-
----
-
-## 2026-04-24T07:59:41Z — US-004: Add W4 conservative wins and genealogy spawn
-
-**Status**: PASSED
-**Files changed**:
-- `scripts/seed-demo-arc.ts` — added W4 writer, deterministic bounce-guard genealogy payloads, W4 gap-detected memory row, and demo-W4 completion output.
-- `history/demo-arc/demo-W4/proposal.md` — seeded W4 proposal artifacts.
-- `history/demo-arc/demo-W4/decision.json` — seeded W4 planner decision artifacts.
-- `history/demo-arc/demo-W4/verdict.json` — seeded W4 verdict artifacts for exp-08 and exp-09.
-- `history/demo-arc/demo-W4/genealogy/new-critic-spec.json` — seeded `NewCriticSpec`-shaped bounce-guard critic payload.
-- `history/demo-arc/demo-W4/genealogy/agent-registration.json` — seeded `AgentJSON`-shaped critic registration payload.
-- `history/demo-arc/baselines.jsonl` — added W4 promoted baseline rows.
-- `history/demo-arc/memory.jsonl` — added W4 gap-detected genealogy trigger and W4 verdict/promote rows.
-- `context/FEATURES.md` — marked feature #57 done.
-
-**Acceptance criteria verified**:
-- [x] `bun scripts/seed-demo-arc.ts` writes `history/demo-arc/demo-W4/proposal.md`, `decision.json`, and `verdict.json`.
-- [x] W4 verdict includes `exp-08-hero-safety-copy` and `exp-09-cta-size-adjust` as passing conservative experiments.
-- [x] Outcome coverage across W1-W4 includes all six of these lanes: `promote-fast-track`, `promote-fallback`, `promote-gate-win`, `archive-gate-fail`, `auto-rollback`, and `hold`.
-- [x] The seeder writes one W4 genealogy-spawned critic spec for a bounce-risk concern under `history/demo-arc/demo-W4/genealogy/`.
-- [x] The genealogy artifacts include a `NewCriticSpec`-shaped JSON payload and an `AgentJSON`-shaped critic registration payload using the existing exported interfaces.
-- [x] W4 memory rows include a `gap-detected` event or equivalent genealogy trigger referencing the W3 bounce/gate-fail pattern and the spawned critic.
-- [x] The script completion message reflects seeding through demo-W4 instead of demo-W2.
-- [x] Running the seeder twice produces deterministic W4/genealogy output under `history/demo-arc/` and does not write outside that directory.
-- [x] `bun run validate` passes.
-
-**Learnings**:
-- W4 experiment specs already contained the conservative passing outcomes, so implementation needed orchestration and genealogy artifact emission rather than new experiment modeling.
-- The seeder's exported interfaces can enforce local demo payload shape with `satisfies` while still avoiding live Managed Agent registration.
-- Prettier reformats the long `context/FEATURES.md` table row when feature #57 status changes.
-
-**Verification**:
-- `bun scripts/seed-demo-arc.ts && cp -R history/demo-arc /tmp/demo-arc-first && bun scripts/seed-demo-arc.ts && diff -qr /tmp/demo-arc-first history/demo-arc`
-- `jq -r '.experiments[].outcome' history/demo-arc/demo-W*/verdict.json | sort -u`
-- `jq '.experiments[] | {exp_id,outcome,classification,reward_delta_pct,gates}' history/demo-arc/demo-W4/verdict.json`
-- `grep 'gap-detected' history/demo-arc/memory.jsonl`
-- `bun run type-check && bun run lint --max-warnings 0 && bun run test && bun run format:check && bun run validate`
-
----
diff --git a/.forge/ralph/webster-feature-number-58-pair-alpha-secondary-sub/prd.json b/.forge/ralph/webster-feature-number-58-pair-alpha-secondary-sub/prd.json
deleted file mode 100644
index 3bdf936..0000000
--- a/.forge/ralph/webster-feature-number-58-pair-alpha-secondary-sub/prd.json
+++ /dev/null
@@ -1,91 +0,0 @@
-{
-  "project": "webster",
-  "branchName": "ralph/webster-feature-number-58-pair-alpha-secondary-sub",
-  "prdFile": "prd.md",
-  "description": "Seed Pair Alpha secondary SaaS and local-service substrates with deterministic mock run artifacts.",
-  "userStories": [
-    {
-      "id": "US-001",
-      "title": "Add deterministic secondary substrate model and HTML writers",
-      "description": "As a Webster implementation operator, I want deterministic SaaS and local-service HTML fixtures so that the submission can demonstrate council generalization beyond the primary substrate.",
-      "acceptanceCriteria": [
-        "Create `scripts/seed-secondary-substrates.ts` with `#!/usr/bin/env bun` and pure TypeScript imports from Node/Bun standard libraries only.",
-        "Define typed constants for exactly two substrates: `saas-alpha` and `local-service-alpha`.",
-        "Write `site/secondary/saas-alpha/index.html` and `site/secondary/local-service-alpha/index.html` as complete single-file HTML landing pages.",
-        "HTML output is deterministic and contains no remote scripts, remote stylesheets, or network-fetching code.",
-        "Export constants or helper functions needed by tests without executing `main()` on import.",
-        "Type-check passes",
-        "Tests pass"
-      ],
-      "technicalNotes": "Mirror `scripts/seed-demo-arc.ts:8-17` for ROOT/path constants and fs/path imports. Follow `scripts/seed-demo-arc.ts:21-64` for literal-union types/interfaces. The new script owns `site/secondary/` only for site output and must not touch `site/before/` or `site/after/`.",
-      "dependsOn": [],
-      "priority": 1,
-      "passes": true,
-      "notes": "Implemented in iteration 1. Files: scripts/seed-secondary-substrates.ts, site/secondary/saas-alpha/index.html, site/secondary/local-service-alpha/index.html."
-    },
-    {
-      "id": "US-002",
-      "title": "Write secondary mock run artifacts",
-      "description": "As a Webster implementation operator, I want onboard and two weekly mock runs per secondary substrate so that the demo can show a complete two-cycle council arc for each new vertical.",
-      "acceptanceCriteria": [
-        "Create `history/secondary-arc/saas-alpha/{onboard,week-1,week-2}/` and `history/secondary-arc/local-service-alpha/{onboard,week-1,week-2}/`.",
-        "Every run folder contains exactly the required artifact names: `proposal.md`, `decision.json`, `verdict.json`, and `apply-log.json`.",
-        "Each `proposal.md` includes experiment blocks with exp IDs, kind, target files, proposed change, and rationale.",
-        "Each `decision.json` includes substrate, run, selected issues, reasoning, and monitor signal fields that mirror the `history/demo-arc` decision convention.",
-        "Each `verdict.json` includes substrate, run, experiments, reward delta, p-value, classification, and outcome fields that mirror the `history/demo-arc` verdict convention.",
-        "Each `apply-log.json` records applied status, touched files, skipped rows, and notes for that run.",
-        "Type-check passes",
-        "Tests pass"
-      ],
-      "technicalNotes": "Follow writer shape in `scripts/seed-demo-arc.ts:393-419`: build typed objects, write `JSON.stringify(value, null, 2)` plus trailing newline, and generate Markdown proposal bodies from typed experiment specs. Use the outcome lane names from `scripts/seed-demo-arc.ts:25-31`.",
-      "dependsOn": [
-        "US-001"
-      ],
-      "priority": 2,
-      "passes": true,
-      "notes": "Implemented in iteration 2. Files: scripts/seed-secondary-substrates.ts, history/secondary-arc/*/{onboard,week-1,week-2}/{proposal.md,decision.json,verdict.json,apply-log.json}."
-    },
-    {
-      "id": "US-003",
-      "title": "Wire CLI package script and scope guards",
-      "description": "As a Webster implementation operator, I want a single package command with strict output boundaries so that seeding is repeatable and cannot corrupt primary demo artifacts.",
-      "acceptanceCriteria": [
-        "Add `seed:secondary` to `package.json` scripts with value `bun scripts/seed-secondary-substrates.ts`.",
-        "The script removes/recreates or overwrites only `site/secondary/` and `history/secondary-arc/`.",
-        "The script never reads from or writes to `history/demo-arc/`, `site/before/`, or `site/after/`.",
-        "Running `bun run seed:secondary` exits 0 and prints a concise deterministic success message.",
-        "`main()` is guarded with `if (import.meta.main)` so tests can import the module safely.",
-        "Type-check passes",
-        "Tests pass"
-      ],
-      "technicalNotes": "Mirror CLI/export pattern in `scripts/seed-demo-arc.ts:485-510`. Add the package script near existing scripts in `package.json:12-23`. Protected paths are explicit feature requirements from `context/FEATURES.md:173` and the PRD input.",
-      "dependsOn": [
-        "US-002"
-      ],
-      "priority": 3,
-      "passes": true,
-      "notes": "Implemented in iteration 3. Files: package.json; verified scripts/seed-secondary-substrates.ts guarded main and owned output boundaries."
-    },
-    {
-      "id": "US-004",
-      "title": "Add Bun tests for layout, idempotency, and protected paths",
-      "description": "As a Webster maintainer, I want automated tests around the seeder so that future changes cannot break file layout, determinism, or safety constraints.",
-      "acceptanceCriteria": [
-        "Create `scripts/__tests__/seed-secondary-substrates.test.ts` using Bun's `describe`, `test`, and `expect` APIs.",
-        "Test verifies both secondary HTML files and all six run folders exist after seeding.",
-        "Test verifies every run folder contains `proposal.md`, `decision.json`, `verdict.json`, and `apply-log.json`.",
-        "Test captures contents of all seeded files, runs the seeder a second time, and asserts byte-identical contents for idempotency.",
-        "Test fingerprints `history/demo-arc/`, `site/before/`, and `site/after/` before and after seeding and asserts they are unchanged.",
-        "`bun test` passes.",
-        "`bun run validate` passes."
-      ],
-      "technicalNotes": "Follow filesystem testing style in `scripts/__tests__/memory.test.ts:1-85`: import Bun test helpers, use fs/path utilities, and cleanly assert deterministic data. Existing tests import source modules directly, as shown by `scripts/__tests__/critic-genealogy.test.ts:1-18`.",
-      "dependsOn": [
-        "US-003"
-      ],
-      "priority": 4,
-      "passes": true,
-      "notes": "Implemented in iteration 4. Files: scripts/__tests__/seed-secondary-substrates.test.ts."
-    }
-  ]
-}
diff --git a/.forge/ralph/webster-feature-number-58-pair-alpha-secondary-sub/prd.md b/.forge/ralph/webster-feature-number-58-pair-alpha-secondary-sub/prd.md
deleted file mode 100644
index 3af1442..0000000
--- a/.forge/ralph/webster-feature-number-58-pair-alpha-secondary-sub/prd.md
+++ /dev/null
@@ -1,186 +0,0 @@
-# Pair Alpha Secondary Substrates — Product Requirements
-
-## Overview
-
-**Problem**: Webster's current demo arc proves the council loop on one primary landing page only. Without secondary substrates, judges and operators cannot see whether the planner, critic council, verdict model, and mock history conventions generalize beyond the healthcare landing page.
-**Solution**: Build `scripts/seed-secondary-substrates.ts`, a deterministic Bun/TypeScript seeder that creates two synthetic single-file secondary landing pages plus mock onboard/week-1/week-2 run artifacts for each substrate.
-**Branch**: `ralph/webster-feature-number-58-pair-alpha-secondary-sub`
-
----
-
-## Goals & Success
-
-### Primary Goal
-
-Create a demo-safe Pair Alpha substrate package that proves Webster can operate on a B2B SaaS landing page and a B2C local-service landing page without touching the primary demo arc or before/after site fork.
-
-### Success Metrics
-
-| Metric | Target | How Measured |
-|--------|--------|--------------|
-| Secondary site files created | `site/secondary/saas-alpha/index.html` and `site/secondary/local-service-alpha/index.html` exist | `bun run seed:secondary` then file existence assertions |
-| Mock run layout complete | Each substrate has `onboard`, `week-1`, and `week-2` folders with `proposal.md`, `decision.json`, `verdict.json`, `apply-log.json` | Unit test enumerates expected paths under `history/secondary-arc/<substrate>/` |
-| Idempotent deterministic output | Re-running the seeder produces byte-identical files | Test snapshots file contents before and after a second run |
-| Scope safety | Seeder never mutates `history/demo-arc/`, `site/before/`, or `site/after/` | Test fingerprints protected directories before/after seeding |
-| Validation green | `bun run validate` and `bun test` pass | Local command output |
-
-### Non-Goals (Out of Scope)
-
-- Live analytics ingestion — this is a synthetic seed artifact, not runtime telemetry.
-- E-commerce substrate — explicitly held out by operator decision; Pair Alpha is SaaS + local service only.
-- Modifying `history/demo-arc/` — the primary demo arc is canonical and must remain untouched.
-- Modifying `site/before/` or `site/after/` — those directories are the primary before/after fork and are not part of the secondary-substrate proof.
-- Network calls or external API integration — deterministic mock data only.
-
----
-
-## User & Context
-
-### Target User
-
-- **Who**: Webster implementation operator preparing the hackathon submission.
-- **Role**: Needs a fast, repeatable local command that seeds extra demo evidence.
-- **Current Pain**: Current mock history is convincing for one primary substrate, but does not demonstrate cross-vertical generalization.
-
-### User Journey
-
-1. **Trigger**: Operator needs to show that Webster can run its council loop beyond the primary healthcare landing page.
-2. **Action**: Operator runs `bun run seed:secondary`.
-3. **Outcome**: Two synthetic landing pages and six mock run folders appear in stable locations, ready for demo narration and automated checks.
-
----
-
-## UX Requirements
-
-### Interaction Model
-
-CLI-only seed workflow:
-
-```bash
-bun run seed:secondary
-```
-
-The command should be silent except for a short success message. It should be safe to run repeatedly in local development and CI. The script must use pure TypeScript/Bun stdlib file operations and no network calls.
-
-### States to Handle
-
-| State | Description | Behavior |
-|-------|-------------|----------|
-| Empty | `site/secondary/` or `history/secondary-arc/` does not exist | Create directories and all expected files |
-| Loading | Seeder is writing deterministic files | Synchronous file writes are acceptable; no progress UI required |
-| Error | Filesystem write fails | Let the thrown error fail the command; do not silently swallow |
-| Success | All secondary files are written | Print deterministic success line and exit 0 |
-
----
-
-## Technical Context
-
-### Patterns to Follow
-
-- **Similar implementation**: `scripts/seed-demo-arc.ts:8-17` — use Bun TypeScript, `node:fs`, `node:path`, `ROOT`, and constants for output directories.
-- **Type pattern**: `scripts/seed-demo-arc.ts:21-64` — define string-literal unions and interfaces for experiment kinds, verdict outcomes, decisions, verdicts, and run rows.
-- **Seed lifecycle pattern**: `scripts/seed-demo-arc.ts:345-354` — initialize owned output directories deterministically. For this feature, remove/recreate only `history/secondary-arc/` and `site/secondary/`, never protected primary paths.
-- **Artifact writer pattern**: `scripts/seed-demo-arc.ts:393-419` — emit pretty-printed JSON files with trailing newline and Markdown proposal files.
-- **CLI entry/export pattern**: `scripts/seed-demo-arc.ts:485-510` — `main()` gated by `if (import.meta.main)` and export constants/helpers for tests.
-- **Package script pattern**: `package.json:12-23` — add a new script beside existing validation/test scripts.
-- **Test pattern**: `scripts/__tests__/memory.test.ts:1-85` — Bun test with `describe`, `test`, `expect`, filesystem setup/cleanup, and deterministic assertions.
-
-### Types & Interfaces
-
-```typescript
-type SecondarySubstrate = "saas-alpha" | "local-service-alpha";
-type SecondaryRun = "onboard" | "week-1" | "week-2";
-type ExperimentKind = "text" | "component" | "asset" | "css";
-type OutcomeLane =
-  | "promote-fast-track"
-  | "promote-fallback"
-  | "promote-gate-win"
-  | "archive-gate-fail"
-  | "auto-rollback"
-  | "hold";
-
-interface SecondaryDecisionJSON {
-  substrate: SecondarySubstrate;
-  run: SecondaryRun;
-  selected_issues: Array<{
-    exp_id: string;
-    kind: ExperimentKind;
-    target_files: string[];
-    proposed_change: string;
-    expected_outcome_lane: OutcomeLane;
-  }>;
-  reasoning: string;
-  monitor_signal: string;
-}
-
-interface SecondaryVerdictJSON {
-  substrate: SecondarySubstrate;
-  run: SecondaryRun;
-  experiments: Array<{
-    exp_id: string;
-    kind: ExperimentKind;
-    reward_delta_pct: number;
-    p_value: number;
-    classification: "improved" | "hurt" | "neutral";
-    outcome: OutcomeLane;
-  }>;
-}
-
-interface SecondaryApplyLogJSON {
-  substrate: SecondarySubstrate;
-  run: SecondaryRun;
-  applied: boolean;
-  touched_files: string[];
-  skipped: Array<{ exp_id: string; reason: string }>;
-  notes: string;
-}
-```
-
-### Architecture Notes
-
-- `context/FEATURES.md:173` defines feature #58 as Layer 11 Pair Alpha: SaaS B2B + local service B2C synthetic HTMLs plus onboard/week-1/week-2 mock runs.
-- The script owns only `site/secondary/` and `history/secondary-arc/`.
-- Mock run artifact filenames must match the existing demo-run convention plus the new apply log: `proposal.md`, `decision.json`, `verdict.json`, `apply-log.json`.
-- Artifact JSON shape should mirror `history/demo-arc` conventions: selected issues in `decision.json`, experiment verdict rows in `verdict.json`, Markdown experiment blocks in `proposal.md`.
-- Tests should import exported constants/helpers from `scripts/seed-secondary-substrates.ts` rather than shelling out where possible, then separately verify package script presence if useful.
-
----
-
-## Implementation Summary
-
-### Story Overview
-
-| ID | Title | Priority | Dependencies |
-|----|-------|----------|--------------|
-| US-001 | Add deterministic secondary substrate model and HTML writers | 1 | — |
-| US-002 | Write secondary mock run artifacts | 2 | US-001 |
-| US-003 | Wire CLI/package script and scope guards | 3 | US-002 |
-| US-004 | Add Bun tests for layout, idempotency, and protected paths | 4 | US-003 |
-
-### Dependency Graph
-
-```text
-US-001 (substrate data + HTML writers)
-    ↓
-US-002 (history/secondary-arc artifact writers)
-    ↓
-US-003 (main + package script + protected path discipline)
-    ↓
-US-004 (tests)
-```
-
----
-
-## Validation Requirements
-
-Every story must pass:
-
-- [ ] Type-check: `bun run type-check`
-- [ ] Lint: `bun run lint --max-warnings 0`
-- [ ] Tests: `bun run test`
-- [ ] Format: `bun run format:check`
-- [ ] Full validation: `bun run validate`
-
----
-
-Generated: 2026-04-24T00:00:00.000Z
diff --git a/.gitignore b/.gitignore
index e47423f..40b2195 100644
--- a/.gitignore
+++ b/.gitignore
@@ -83,8 +83,34 @@ demo-output/videos/
 /plan.md
 /research.md
 
-
 # Claude Design polish handoff bundles — committed per-slot only after review
 skills/webster-video/polish-slots/**/handoff/
 skills/webster-video/polish-slots/handoff-shared/
 skills/webster-video/polish-slots.zip
+
+# Internal tracking docs — preserved in ~/Vault/Projects/webster/internal-tracking/
+context/EXPANSION-TASKS.md
+context/E2E-IMPLEMENTATION-TRACKER.md
+context/SITE-FORK-CHECKLIST.md
+context/ROADMAP.md
+context/VIDEO-PLAN.md
+context/VIDEO-PLAN-90s.md
+context/v2-design.md
+
+# Intermediate session prompts — only first/second-wbs and sim-council are public-facing
+prompts/third-wbs-session.md
+prompts/fourth-wbs-session.md
+prompts/sim-audit-fix-session.md
+prompts/composition-session.md
+prompts/e2e-demo-run-session.md
+prompts/sim-runner.md
+
+# History operator notes (story belongs in README/AGENTS.md, not duplicated)
+history/AGENTS.md
+history/CLAUDE.md
+
+# Polish-session worktree prompts (local hand-off only)
+ONBOARDING-V2-PROMPT.md
+
+# Personal launchd plist (hardcoded user paths) — preserved in vault
+deploy/webster-dispatcher.plist
diff --git a/AGENTS.md b/AGENTS.md
index 2f98ae8..797fc51 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -22,9 +22,9 @@ Two active workstreams:
 2. `context/ARCHITECTURE.md` — current system design
 3. `context/FEATURES.md` — shipped state + stream allocation
 4. `context/VISION.md` — canonical north-star for the active hackathon expansion. If about to code or make an architectural call, this doc tells you whether you're drifting.
-5. `context/EXPANSION-TASKS.md` — topologically ordered tasks with acceptance criteria
-6. `context/QUALITY-GATES.md` — validation rules (mirror Forge pattern)
-7. `~/Vault/Projects/webster/webster-decision-log.md` — architectural decisions with rationale
+5. `context/QUALITY-GATES.md` — validation rules (mirror Forge pattern)
+6. `~/Vault/Projects/webster/webster-decision-log.md` — architectural decisions with rationale
+7. `~/Vault/Projects/webster/internal-tracking/context/EXPANSION-TASKS.md` — local-only task tracker for the hackathon expansion (vault, not in repo)
 
 ## Communication with Richie
 
@@ -103,7 +103,7 @@ bun run validate
 
 ## Task pickup protocol (hackathon expansion)
 
-1. Check `context/EXPANSION-TASKS.md` — pick next unblocked task in topological order. Do NOT skip T0.
+1. Check `~/Vault/Projects/webster/internal-tracking/context/EXPANSION-TASKS.md` (vault, local-only) — pick next unblocked task in topological order. Do NOT skip T0.
 2. Re-read the task's acceptance criteria
 3. Read every file the task touches before editing
 4. Implement minimally — no scope expansion, no drive-by refactors
@@ -147,4 +147,4 @@ State the conflict. Don't paper over it.
 
 Consult `~/Vault/Projects/webster/webster-decision-log.md` — every locked decision with rationale.
 
-If a path isn't clear and VISION.md / EXPANSION-TASKS.md don't answer, leave a `[STUCK]` or `[QUESTION]` prefix in your session output. Don't compose around it.
+If a path isn't clear and VISION.md doesn't answer, leave a `[STUCK]` or `[QUESTION]` prefix in your session output. Don't compose around it.
diff --git a/README.md b/README.md
index af1c102..d38dced 100644
--- a/README.md
+++ b/README.md
@@ -147,6 +147,18 @@ Current state: 175 tests passing, 0 lint warnings, 0 type errors, 18 JSON specs
 - `git` with commit-signing configured
 - An Anthropic API key stored in macOS keychain under service `anthropic-webster`. First-session will show the exact `security add-generic-password` command if missing.
 
+### The `wbs` alias (project convention)
+
+The `wbs @prompts/...` commands below assume a shell alias that launches Claude Code into Webster's dispatcher mode (Opus 4.7, 1M context, custom system prompt at `.claude/dispatcher.md`, custom settings at `.claude/dispatcher-settings.json`). Add to your shell rc:
+
+```bash
+alias wbs='cd ~/Projects/webster && claude --dangerously-skip-permissions --model claude-opus-4-7 \
+  --settings .claude/dispatcher-settings.json \
+  --system-prompt "$(cat .claude/dispatcher.md)"'
+```
+
+Or run the equivalent `claude --model ... --settings ... --system-prompt ...` command directly from the repo root (the `.claude/` paths are relative) without aliasing. Either works.
+
 ### Bootstrap (one-time)
 
 ```bash
diff --git a/context/E2E-IMPLEMENTATION-TRACKER.md b/context/E2E-IMPLEMENTATION-TRACKER.md
deleted file mode 100644
index 08003f4..0000000
--- a/context/E2E-IMPLEMENTATION-TRACKER.md
+++ /dev/null
@@ -1,206 +0,0 @@
-# Webster E2E Implementation Tracker
-
-> Handoff file for compaction recovery. Read this first if the session is resumed. Last updated: 2026-04-25.
-
-## Operating mode
-
-- Execute directly; do not wait for approval unless a task has unresolved ambiguity.
-- Preserve production Webster:
-  - Do not modify the existing production `agents/webster-*` specs unless the task explicitly says so.
-  - Do not modify `prompts/second-wbs-session.md`.
-- Validate before claiming completion.
-- Prefer narrow reads and targeted edits.
-- Use subagents for repo-wide audits or isolated review so the main context stays lean.
-
-## Current repo state summary
-
-Verified by main session + subagent scout:
-
-| Task                     | Current status                               | Evidence / notes                                                                                                                                                                                                                                                        |
-| ------------------------ | -------------------------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| T0 Pass-7 fixes          | Done in tree                                 | `scripts/apply-worker-cli.ts`, `scripts/apply-worker.ts`, `.husky/pre-commit`, `scripts/anthropic-agents.ts`, `scripts/planner-invoke.ts`, `scripts/critic-genealogy.ts`; targeted tests passed. Perl byte-count acceptance says 13 but actual correct count is 14.     |
-| T1 Memory stores         | Appears implemented                          | `scripts/provision-memory-stores.ts`, tests exist. Needs validation/live run if not already done.                                                                                                                                                                       |
-| T2 Sim agents            | Appears implemented                          | 18 `agents/webster-{lp,site}-sim-*.json` specs and `scripts/register-sim-agents.ts` exist.                                                                                                                                                                              |
-| T3 Contexts              | Appears implemented                          | `demo-landing-page/context/*`, `demo-sites/northwest-reno/context/*`, `scripts/context-schema.ts` exist.                                                                                                                                                                |
-| T4 Ugly sites            | Partial / uncommitted                        | Ugly files exist but `git status` shows modified/untracked assets. Needs browser/render check and commit cleanup.                                                                                                                                                       |
-| T5 Synthetic analytics   | Appears implemented                          | `scripts/synthetic-analytics.ts` and tests exist.                                                                                                                                                                                                                       |
-| T6 Sim council fork      | Appears implemented                          | `prompts/sim-council.md` and tests exist.                                                                                                                                                                                                                               |
-| T7 Simulation wrapper    | Appears implemented                          | `scripts/run-simulation.ts` and tests exist.                                                                                                                                                                                                                            |
-| T8 Entrypoints           | Appears implemented                          | `scripts/run-simulation-lp.ts`, `scripts/run-simulation-site.ts` exist.                                                                                                                                                                                                 |
-| T9 Manifest/final sheets | Appears implemented                          | `scripts/build-demo-manifest.ts` and tests exist.                                                                                                                                                                                                                       |
-| T10 Full dry run         | Not done                                     | No evidence of full dual 10-week run and handoff.                                                                                                                                                                                                                       |
-| T11 Auto-capture         | Implemented / needs authenticated screenshot | Added capture script, bridge, preflight, screenshot manifest, package scripts, and CAPTURE_TRIGGER emission. `browser-use` requires `-b real --profile Default`; current local Console session is logged out, so authenticated PNG acceptance still needs Richie login. |
-| T12 Onboarding v2        | Not started                                  | Missing `scripts/onboarding/*` and status flow. Secondary/case-study path.                                                                                                                                                                                              |
-| T13 Empire Asphalt       | Not started / blocked                        | Blocked on consent artifact. Missing brand corpus and external demo repo.                                                                                                                                                                                               |
-
-## Current validation state
-
-Latest full validation is green:
-
-```bash
-bun run validate
-# 181 pass, 0 fail
-```
-
-T11 preflight correctly fails until Richie logs into Anthropic Console in local Chrome `Default` profile:
-
-```bash
-bun run sim:preflight
-# AUTH_EXPIRED: Anthropic Console Memory Stores page is not authenticated/reachable
-```
-
-Auth-expired capture path was verified against the current local Chrome state:
-
-```bash
-bun scripts/capture-mem-stores.ts '<week-1 trigger json>'
-# exits 1 with AUTH_EXPIRED because local Anthropic Console is not logged in
-```
-
-Targeted T0 tests passed earlier:
-
-```bash
-bun test scripts/__tests__/anthropic-agents.test.ts scripts/__tests__/critic-genealogy.test.ts scripts/__tests__/apply-worker-cli.test.ts
-# 50 pass, 0 fail
-```
-
-## Immediate next steps
-
-### Step A — Restore green baseline
-
-Done. `bun run validate` is green.
-
-### Step B — Verify implemented tasks T1-T9 before adding new code
-
-Run fast, scoped checks first:
-
-```bash
-bun test \
-  scripts/__tests__/provision-memory-stores.test.ts \
-  scripts/__tests__/register-sim-agents.test.ts \
-  scripts/__tests__/context-schema.test.ts \
-  scripts/__tests__/synthetic-analytics.test.ts \
-  scripts/__tests__/sim-council.test.ts \
-  scripts/__tests__/run-simulation.test.ts \
-  scripts/__tests__/run-simulation-entrypoints.test.ts \
-  scripts/__tests__/build-demo-manifest.test.ts
-```
-
-Then run full `bun run validate` again.
-
-### Step C — Finalize T4 uncommitted ugly-site state
-
-1. Review ugly-site diffs:
-
-   ```bash
-   git diff -- demo-landing-page/ugly demo-sites/northwest-reno/ugly
-   find demo-landing-page/ugly demo-sites/northwest-reno/ugly -maxdepth 3 -type f
-   ```
-
-2. Confirm no JS and no external network resources:
-
-   ```bash
-   rg -n "<script|https?://|//" demo-landing-page/ugly demo-sites/northwest-reno/ugly
-   ```
-
-3. Browser/render smoke check with existing screenshot tooling or Playwright file URLs.
-4. Commit only T4-related files if validation passes:
-
-   ```bash
-   git add demo-landing-page/ugly demo-sites/northwest-reno/ugly
-   git commit -m "feat: add ugly simulation substrates"
-   ```
-
-### Step D — Implement T11 auto-capture infrastructure
-
-Implemented files:
-
-- `scripts/capture-mem-stores.ts`
-- `scripts/sim-capture-bridge.ts`
-- `scripts/sim-preflight.ts`
-- `scripts/emit-memory-screenshot-manifest.ts`
-- `scripts/__tests__/sim-capture.test.ts`
-- `scripts/run-simulation.ts` emits exact `CAPTURE_TRIGGER` JSON at weeks 1, 5, and 10.
-- `package.json` has `sim:lp`, `sim:site`, `sim:capture-bridge`, `sim:preflight`, `sim:emit-manifest`.
-
-Verified:
-
-- `bun run sim:preflight` now enforces authenticated Console reachability and currently fails with `AUTH_EXPIRED`, as intended while logged out.
-- Auth-expired path exits non-zero with `AUTH_EXPIRED`.
-- Bridge tests prove capture failure halts.
-- Trigger format matches `prompts/sim-runner.md`.
-- `bun run validate` green.
-
-Remaining T11 live acceptance:
-
-- Richie must log into Anthropic Console in local Chrome profile `Default`.
-- Manual Memory Stores screenshot is available at `assets/memory-stores-screenshots/manual/console-memory-stores-2026-04-25.png`.
-- `bun run sim:emit-manifest` writes a manifest containing this manual proof.
-- Auto-capture is optional. If required, set `WEBSTER_REQUIRE_CONSOLE_CAPTURE=1` and re-run `bun run sim:preflight`; it should return 0 only after authenticated Console reachability is confirmed.
-- Then commit: `feat: capture memory store console screenshots`.
-
-### Step E — T10 full dry run and handoff
-
-Run after T11:
-
-```bash
-bun run validate
-bun run sim:preflight
-# token-enabled session only:
-bun scripts/provision-memory-stores.ts
-bun scripts/register-sim-agents.ts
-bun scripts/run-simulation-lp.ts | bun scripts/sim-capture-bridge.ts
-bun scripts/run-simulation-site.ts | bun scripts/sim-capture-bridge.ts
-bun run sim:emit-manifest
-bun scripts/build-demo-manifest.ts
-bun run validate
-```
-
-Manual checks:
-
-- Both `demo-output/landing-page/` and `demo-output/northwest-reno/` have week progressions.
-- Screenshots render at 375/768/1440; no blank pages.
-- Week 10 visibly improves over week 0.
-- Memory stores contain meaningful summaries.
-- Genealogy outcome documented honestly.
-
-Commit final handoff assets only if appropriate:
-
-```bash
-git add demo-output assets/memory-stores-screenshots history
-git commit -m "chore: finalize simulation handoff assets"
-```
-
-## Secondary path after core demo
-
-### T12 onboarding v2
-
-Implement only after T10 or if Richie makes the case-study video the priority.
-
-Files:
-
-- `skills/webster-onboarding/SKILL.md`
-- `scripts/onboarding/verify-env.ts`
-- `scripts/onboarding/verify-all.ts`
-- `scripts/onboarding/scaffold-repo.ts`
-
-Acceptance: no key leakage, phase gates, idempotent status file, live verification.
-
-### T13 Empire Asphalt
-
-Do not start until consent exists:
-
-- `assets/onboarding-case-study/dad-consent.txt`
-
-Then prepare:
-
-- `context/brand-corpus/*`
-- private `richsak/empire-paving-demo` repo
-- ugly v0 Astro site with Empire palette.
-
-## If compaction happens
-
-1. Read this file.
-2. Read `context/VISION.md` locked section.
-3. Run `git status --short`.
-4. Run `bun run validate` or the last scoped test listed above.
-5. Continue from the first step under `Immediate next steps` that is not yet marked done.
diff --git a/context/EXPANSION-TASKS.md b/context/EXPANSION-TASKS.md
deleted file mode 100644
index 5dda32e..0000000
--- a/context/EXPANSION-TASKS.md
+++ /dev/null
@@ -1,471 +0,0 @@
-# Webster Expansion Tasks
-
-> Topologically ordered. Implement in sequence. Do NOT skip T0. Read `context/VISION.md` before each task and re-read it before marking any task done.
-
-## Session start protocol
-
-When a new session starts on this repo with a prompt like "Go" or "start" or "continue":
-
-1. **Read the first-actions list in `AGENTS.md`** in full (including `context/VISION.md` and this file) before writing any code
-2. **Start T0 immediately** — no confirmation needed to begin work
-3. **Stop after T0 completes** (validate green + committed). Report completion to Richie in 3–5 lines: what changed, test results, commit hash. Wait for his green-light before starting T1.
-4. **From T1 onward, proceed task-by-task without waiting for approval** BUT before starting each new task, post a 2-line announcement:
-   - Line 1: `Starting T<n>: <one-line-summary>`
-   - Line 2: `Files I'll touch: <comma-separated-paths>`
-
-   This gives Richie visibility to interrupt if the approach is drifting without blocking the default path.
-
-5. **At any point**, if ambiguity exceeds what VISION.md + this file answer: stop and surface `[STUCK]` with a concrete question. Do not compose around it.
-
-## Per-task loop
-
-1. Re-read the task's acceptance criteria here
-2. Read the files the task touches before editing them
-3. Implement minimally — no scope expansion, no drive-by refactors, no "while I'm here"
-4. Write the tests listed in acceptance criteria
-5. `bun run validate` must be green
-6. Conventional commit (`fix:` for T0, `feat:` for expansion tasks). One task = one commit (or one small series)
-7. Before marking done, re-read VISION.md's "what's locked" + the task's acceptance criteria. If anything drifted, revisit.
-
-## Day-by-day target
-
-- **Day 1**: T0, T1, T3, T4 (infrastructure + assets, parallel-friendly)
-- **Day 2**: T2, T5 (agent specs + synthetic analytics)
-- **Day 3**: T6, T7, T8 + first dry run
-- **Day 4**: T9, T10 + diagnose/re-run if needed + handoff
-
----
-
-## T0 — Pass-7 review fixes
-
-**Status**: blocking. 4 of 5 fixes touch simulation-path code; skipping T0 risks contaminating the demo with known bugs.
-
-**Files**:
-
-- `scripts/apply-worker-cli.ts:142` — og_card dims 1200x630 → 1536x1024 (or closest supported)
-- `scripts/apply-worker.ts:733-739` — `runtime_failure` drops from visual-veto branch, falls through to `apply-fail`
-- `.husky/pre-commit:13-15` — add `chomp;` + `print "$_\0"` in perl pipeline
-- `scripts/critic-genealogy.ts` — wrap `fetchSessionSnapshot` call in `main()` with try/catch; persist spec.json + snapshot-error sentinel + agent JSON on failure; exit non-zero after commitArtifacts
-- Extract shared paginated `findAgentByName` helper, import from both `scripts/planner-invoke.ts` and `scripts/critic-genealogy.ts`
-
-**Accept**:
-
-- `bun run validate` green
-- New/updated unit tests: `runtime_failure → apply-fail`, snapshot-fetch-fail still writes spec.json, pagination helper finds name on page 2
-- `printf 'foo.ts\0bar.md\0baz.txt\0' | perl -0ne 'chomp; print "$_\0" if /\.(ts|js|json|md|jsonc)$/;' | wc -c` returns 14
-- Conventional commits (one per fix, or one bundled `fix: apply pass 7 review items`)
-
----
-
-## T1 — Memory store provisioning
-
-**Depends on**: T0
-
-Create `scripts/provision-memory-stores.ts` — idempotent provisioner that creates 12 memory stores via `POST /v1/memory_stores` (beta header `managed-agents-2026-04-01`).
-
-**Stores** (6 per substrate):
-
-| Store name                            | Writer                        | Readers                       |
-| ------------------------------------- | ----------------------------- | ----------------------------- |
-| `webster-council-memory-lp`           | orchestrator (RW)             | all LP sim agents (read_only) |
-| `webster-planner-memory-lp`           | planner (RW)                  | planner (RW)                  |
-| `webster-redesigner-memory-lp`        | redesigner (RW)               | redesigner (RW)               |
-| `webster-genealogy-memory-lp`         | orchestrator (RW)             | genealogy logic (read_only)   |
-| `webster-conversion-critic-memory-lp` | conversion-critic (RW)        | conversion-critic (RW)        |
-| `webster-visual-reviewer-memory-lp`   | visual-reviewer (RW)          | visual-reviewer (RW)          |
-| (same 6, `-site` in place of `-lp`)  | (parallel for site substrate) | (parallel)                    |
-
-**Output**: `context/memory-stores.json`:
-
-```json
-{
-  "lp": {
-    "council": "memstore_01...",
-    "planner": "memstore_01...",
-    "redesigner": "memstore_01...",
-    "genealogy": "memstore_01...",
-    "conversion-critic": "memstore_01...",
-    "visual-reviewer": "memstore_01..."
-  },
-  "site": { ... }
-}
-```
-
-**Accept**:
-
-- Running script twice produces identical output (idempotent by name lookup — if store with `name` already exists, reuse its ID)
-- `context/memory-stores.json` contains 12 entries keyed by substrate + role
-- Unit test mocks the API, verifies idempotency + error handling (network fail + partial completion resume)
-- Script is safe to re-run after partial failure
-
----
-
-## T2 — 18 new sim-specific agent specs
-
-**Depends on**: T0
-
-Create 18 new MCP-native agent specs. **Existing 9 `webster-*` agents are NOT modified.**
-
-**LP sim set** (9 files under `agents/`):
-
-- `webster-lp-sim-monitor.json` (Haiku 4.5)
-- `webster-lp-sim-seo-critic.json` (Sonnet 4.6)
-- `webster-lp-sim-brand-voice-critic.json` (Sonnet 4.6)
-- `webster-lp-sim-fh-compliance-critic.json` (Sonnet 4.6)
-- `webster-lp-sim-conversion-critic.json` (Sonnet 4.6)
-- `webster-lp-sim-copy-critic.json` (Sonnet 4.6)
-- `webster-lp-sim-redesigner.json` (Opus 4.7)
-- `webster-lp-sim-planner.json` (Opus 4.7)
-- `webster-lp-sim-visual-reviewer.json` (Opus 4.7)
-
-**Site sim set** (9 files under `agents/`):
-
-- `webster-site-sim-monitor.json`
-- `webster-site-sim-seo-critic.json`
-- `webster-site-sim-brand-voice-critic.json`
-- `webster-site-sim-licensing-and-warranty-critic.json` (replaces fh-compliance slot, Sonnet 4.6)
-- `webster-site-sim-conversion-critic.json`
-- `webster-site-sim-copy-critic.json`
-- `webster-site-sim-redesigner.json`
-- `webster-site-sim-planner.json`
-- `webster-site-sim-visual-reviewer.json`
-
-**System prompt differences from existing `webster-*` agents**:
-
-- **No WebFetch**. All site reads via `get_file_contents` (GitHub MCP) at the demo branch ref passed in user.message (e.g. `ref: demo-sim-lp/w03`)
-- **No LP_TARGET URL** reference. Replace with substrate-appropriate context block
-- **Context paths substrate-specific**: LP agents read `demo-landing-page/context/business.md`; site agents read `demo-sites/northwest-reno/context/business.md`
-- **Site pages (site set only)**: redesigner + critics reference the 3-page structure (`/`, `/services`, `/free-estimate`)
-- **licensing-and-warranty-critic**: scoped to contractor licensing number display, insurance claims, warranty terms, service-area clarity
-- **Brand-voice critic**: reads `brand.json` + `business.md`, enforces voice + do_not_use
-
-**Registration**: via idempotent `POST /v1/agents` (by-name lookup before POST). Wrap in `scripts/register-sim-agents.ts` or extend existing registration script.
-
-**Accept**:
-
-- All 18 specs validate against existing JSON schema
-- `scripts/register-sim-agents.ts` idempotent: re-running doesn't duplicate
-- Spec schema tests cover both sets
-- No reference to `LP_TARGET` or WebFetch anywhere in the 18 new specs
-- Existing 9 `webster-*` agents unchanged (diff check)
-
----
-
-## T3 — Prefilled contexts
-
-**Depends on**: T0. Can run in parallel with T2.
-
-### 3a — Richer Health (LP)
-
-Directory: `demo-landing-page/context/`
-
-- `business.md` — copy from existing `context/business.md` (already Richer-Health-scoped)
-- `personas.json` — 3 personas extracted from `.claude/skills/nicolette-richer/references/brand-bible.md`. Each persona: `{id, name, archetype, goals, anxieties, conversion_triggers, behavior_hints}`. Suggested: "credentials-conscious-executive" / "curious-self-starter" / "skeptical-researcher".
-- `brand.json` — structured: `{voice, tone, palette, typography, signature_phrases, do_not_use}`. Extract from brand bible.
-
-### 3b — Northwest Home Renovations (site)
-
-Directory: `demo-sites/northwest-reno/context/`
-
-- `business.md` — invent from scratch. Fields: business name, owner ("Sam Reyes"), location (Pacific Northwest, non-specific town), services (kitchen / bath / deck renovation), license number (fictional, e.g. WA-CONTR-NWR-2024), warranty terms ("5-year workmanship, 10-year structural"), insurance ("$2M liability"), tone ("competent, direct, trust-heavy").
-- `personas.json` — 3 B2C homeowner personas: "first-time-homeowner-anxious" (scared of being scammed), "price-comparing-pragmatist" (getting 3 quotes), "warranty-conscious-veteran" (has been burned before).
-- `brand.json` — palette (navy/white/safety-orange OR forest-green/cream/brass — pick one, document choice), typography (clear sans-serif + utility), voice (direct + trust-heavy), do_not_use (no superlatives, no "world-class", no generic "quality").
-
-**Accept**:
-
-- Both contexts validate against a shared schema you define in the task (even a simple Zod schema in `scripts/context-schema.ts` is fine)
-- Both brand extracts are rich enough to give the brand-voice critic concrete rules to enforce (at least 5 do_not_use items, palette with hex codes, typography with font families)
-- No cross-contamination (contractor context never references Richer Health; LP context never references Northwest Reno)
-
----
-
-## T4 — Ugly sites
-
-**Depends on**: T3 (needs brand.json to know what the ideal is, so we can deliberately violate it). Can run in parallel with T2.
-
-### 4a — Richer Health ugly
-
-Directory: `demo-landing-page/ugly/`
-
-- `index.html` — single file, intentionally unpolished
-- `style.css` — inline acceptable; keep minimal
-- `README.md` — "Intentionally ugly. Do NOT improve outside simulation."
-
-**Characteristics** (each is something a specific critic should flag):
-
-- Generic stock hero image (not Nicolette's actual photo) — conversion / brand-voice / SEO ding
-- Vague headline "Health & Wellness Coaching" — copy / conversion ding
-- No credentials anywhere — fh-compliance / brand-voice ding
-- Weak CTA "Learn More" — conversion ding
-- Times New Roman everywhere — brand-voice / visual-review ding
-- Center-aligned body text, no hierarchy — visual-review / copy ding
-- No testimonials / social proof — conversion ding
-
-Reference (human-read only, not committed to repo references): existing `site/before/index.html` for layout structure. Do NOT copy — derive an intentionally-worse version.
-
-### 4b — Contractor ugly (3 pages)
-
-Directory: `demo-sites/northwest-reno/ugly/`
-
-- `index.html` (home) + `style.css`
-- `services.html`
-- `free-estimate.html`
-- `README.md`
-
-**Characteristics**:
-
-- Home: Times New Roman, clip-art header, no photos of real work, generic phrases ("Best in the business!"), CTA is bare text link "Contact us"
-- Services: a bulleted list with no descriptions, no prices, no warranties mentioned
-- Free-estimate: unlabeled form inputs, no required-field markers, no phone number option, no expected-response-time
-- Cross-page: inconsistent nav, no footer, no license number anywhere, no insurance mention, no before/after photos
-
-**Accept**:
-
-- Both ugly states commit to dedicated demo branches (`demo-sim-lp/w00`, `demo-sim-site/w00`)
-- No JavaScript, no external network resources (self-contained HTML/CSS)
-- When loaded in a browser, both sites render (no broken markup); they're ugly, not broken
-- Diff against `brand.json` shows broad violation — every persona and every brand rule has something to attack
-
----
-
-## T5 — Synthetic Analytics Agent
-
-**Depends on**: T3
-
-Build `scripts/synthetic-analytics.ts` — generates per-week analytics reacting to current site state.
-
-**Inputs** (JSON file passed via CLI or stdin):
-
-```ts
-{
-  substrate: "lp" | "site",
-  week: number,                   // 0-indexed, 0 = baseline
-  weekDate: string,               // ISO, for seasonality
-  sitePath: string,               // absolute path to site dir for current week
-  contextPath: string,            // absolute path to context dir
-  previousAnalytics?: AnalyticsJson, // week N-1, absent on week 0
-  seed: string                    // determinism
-}
-```
-
-**Output**:
-
-- `analytics.json` — schema matches existing `scripts/analytics-ingestion.ts` (`sessions`, `bounce_rate`, `avg_time_s`, `scroll_depth_{25,50,75,100}`, `cta_clicks` per CTA, `section_engagement[]`)
-- `analytics-reasoning.md` — per-persona narrative of why metrics moved (3–5 sentences each)
-
-**Agent invocation**:
-
-- Uses `/v1/messages` (not Managed Agents) for simplicity — synthetic analytics is one-shot, no memory needed
-- Model: Opus 4.7 (judgment-heavy)
-- System prompt includes: persona distribution (5000 users × 3 personas, fixed), hard continuity (±15% per metric unless justified), seasonality hints, realistic event variance, no bias toward specific gaps
-
-**Accept**:
-
-- Golden-file test: given fixed seed + fixed week-0 HTML + personas, produces identical analytics.json on re-run
-- Continuity test: given week-0 output as previousAnalytics + SAME site (unchanged), week-1 deltas stay within ±5% per metric (no change = no reason to swing)
-- Continuity test: given week-0 output + MUTATED site (hero copy improved), week-1 bounce_rate drops by 5–20%, with the justification recorded in `analytics-reasoning.md`
-- Schema-compatibility test: output `analytics.json` parses cleanly via existing `analytics-ingestion.ts` normalizer
-
----
-
-## T6 — Sim orchestrator fork
-
-**Depends on**: T2, T3, T4
-
-Fork `prompts/second-wbs-session.md` → `prompts/sim-council.md`. Parameterize the hardcoded values.
-
-**Changes from source**:
-
-- Header block takes env vars: `SUBSTRATE` (`lp`|`site`), `WEEK_DATE`, `BRANCH` (e.g. `demo-sim-lp/w03`), `AGENT_SET` (`webster-lp-sim`|`webster-site-sim`), `CONTEXT_PATH`, `SITE_PATH`, `MEMORY_STORES_JSON`
-- Drop the `LP_TARGET=https://certified.richerhealth.ca` line and remove all WebFetch-based critic instructions (sim agents already read via MCP)
-- Drop the 10-week mock-history seeder (Step 1) — simulation wrapper generates fresh analytics per week via T5
-- Agent IDs sourced from `context/sim-agents.json` (produced by T2's registration script), keyed by `$AGENT_SET`
-- Memory-store attachment in every `POST /v1/sessions` call — attach the role-appropriate store from `$MEMORY_STORES_JSON`
-
-**Accept**:
-
-- `sim-council.md` validates shellcheck on its bash blocks
-- Running with `SUBSTRATE=lp WEEK_DATE=2026-02-01 BRANCH=demo-sim-lp/w00 ... wbs @prompts/sim-council.md` produces a week-0 council run with all agents invoked via sim IDs
-- Production `prompts/second-wbs-session.md` untouched (diff check)
-
----
-
-## T7 — Simulation wrapper
-
-**Depends on**: T5, T6
-
-Build `scripts/run-simulation.ts` — library + CLI that loops N weeks for one substrate.
-
-**Flow per week**:
-
-1. Checkout/create demo branch `demo-sim-<substrate>/w<NN>`
-2. If week 0: commit the ugly site; else use previous week's branch as base
-3. Call Synthetic Analytics Agent (T5) → write `history/<substrate-demo>/w<NN>/analytics.json`
-4. Spawn `prompts/sim-council.md` with env vars for this week
-5. After orchestrator completes: capture screenshots at 3 breakpoints × all pages using Playwright on the local file (no deploy needed — Playwright can open file:// URLs)
-6. Write memory-store summaries via REST API (council + planner + redesigner insights)
-7. Bundle week artifacts into `demo-output/<substrate>/week-NN/`
-
-**Accept**:
-
-- Config-driven (substrate specifier, week count, paths) — not substrate-hardcoded
-- Unit test with mock council (no real API calls) runs 2-week loop end-to-end
-- Screenshot capture works with Playwright headless on `demo-landing-page/ugly/index.html` (file://)
-- Fixed seed → identical demo branch HEAD after N weeks
-
----
-
-## T8 — Per-substrate invocations
-
-**Depends on**: T7
-
-Thin entry scripts:
-
-- `scripts/run-simulation-lp.ts` — calls `run-simulation.ts` with `substrate=lp` + LP paths + 10 weeks
-- `scripts/run-simulation-site.ts` — calls `run-simulation.ts` with `substrate=site` + site paths + 10 weeks
-
-**Accept**:
-
-- `bun scripts/run-simulation-lp.ts` runs 10 weeks end-to-end, ~30–45 min
-- `bun scripts/run-simulation-site.ts` same
-- Output directories `demo-output/landing-page/` and `demo-output/northwest-reno/` both populated with week-00 through week-10 artifacts
-- Memory Stores Console shows 12 entries populated
-
----
-
-## T9 — Demo manifest + final sheets
-
-**Depends on**: T8
-
-Build `scripts/build-demo-manifest.ts` — aggregates simulation output.
-
-**Per-substrate outputs**:
-
-- `demo-output/<substrate>/demo-manifest.json` — machine-parseable index of all weeks, screenshots, council artifacts, genealogy events, memory-store references
-- `demo-output/<substrate>/final-sheet.png` — side-by-side week-0 vs week-10 desktop hero shot (ffmpeg or ImageMagick)
-
-**Accept**:
-
-- Manifest validates against a schema you define
-- Final sheet is visually compelling (real improvement visible)
-- Manifest includes absolute paths the downstream video-composition session can feed to Remotion
-
----
-
-## T10 — End-to-end dry run + handoff
-
-**Depends on**: T7, T8, T9
-
-Run both simulations. Inspect outputs. Decide.
-
-**Accept — all must be true before handoff to video composition**:
-
-- Both `demo-output/` substrates contain full 10-week progressions
-- Screenshots visually coherent (no blank pages, no JS errors, layouts render at all 3 breakpoints)
-- Memory Stores Console shows 12 stores with content (open one, verify it contains meaningful summaries)
-- Genealogy log shows what happened (a spawn, or a diagnosed-then-fixed non-spawn, or an explicit "no spawn in 10 weeks" with investigation notes)
-- If no spawn and no budget to re-run: accept outcome, update VISION.md risk section with the finding, proceed to video composition with improvement-only narrative
-
-**Handoff deliverable** (for fresh Claude Code session to compose video):
-
-- `demo-output/<substrate>/demo-manifest.json` × 2
-- `demo-output/<substrate>/final-sheet.png` × 2
-- Memory-Stores-Console screenshots (captured manually by Richie)
-- Nicolette clip (recorded separately by Richie)
-- Onboarding skill recording (recorded separately by Richie)
-- Brand bible content for copy/narration reference
-
----
-
-## Validation checkpoints
-
-Before moving to the next task, verify:
-
-1. `bun run validate` green
-2. Committed (conventional commit message)
-3. Re-read VISION.md's "what's locked" section — did you drift?
-4. Flag anything unexpected with `[STUCK]` prefix before continuing
-
-## When genuinely stuck
-
-- Re-read VISION.md. The vision is the real contract.
-- Surface the block to Richie. Don't produce composed-looking workarounds.
-- Visible struggle > invisible corner-cutting.
-
----
-
-## Tier 2 implementation tasks (case-study + auto-capture support)
-
-> Added 2026-04-25. These tasks support the Tier 2 demo asset (Empire Asphalt onboarding case study video + automated Anthropic Console screenshot capture for Beat 5). Specced in `context/ONBOARDING-CASE-STUDY.md` and `prompts/sim-runner.md`. T11 is **blocking** T8/T10 because the sim must emit capture triggers and the bridge must consume them; T12 and T13 are case-study-only and can run parallel to T8–T10.
-
-## T11 — Auto-capture infrastructure
-
-**Depends on**: T7 (sim wrapper)
-**Blocks**: T8 (sim invocations should emit capture triggers from the start), T10 handoff (Memory Stores screenshots are part of the deliverable)
-
-Wire capture-trigger emission into the sim wrapper, build the bridge process that reads triggers and spawns captures, and build the capture script that drives the `browser-use` CLI.
-
-**Before writing any T11 code (5-min pre-flight):** manually drive `browser-use` once against the real Anthropic Console memory stores page and capture the actual selectors:
-
-```bash
-browser-use --profile "Default" open https://console.anthropic.com  # navigate to memory stores via the UI
-browser-use state                                                    # dump real selectors and URL
-```
-
-Copy the real list-page URL and a real container selector from the `state` output into `scripts/capture-mem-stores.ts`. The `[data-testid='memory-stores-list']` selector and `/settings/memory-stores` path used in design docs are intuition, not verified — replacing them with what `browser-use state` actually returns prevents a silent hang in the capture script.
-
-**Code:**
-
-- Modify `scripts/simulation-core.ts` to emit `CAPTURE_TRIGGER` JSON lines on stdout at weeks 1, 5, and 10 (exact format spec in `prompts/sim-runner.md` "Trigger protocol")
-- Add `scripts/capture-mem-stores.ts` — accepts `{substrate, week, output}` from a trigger payload, shells out to `browser-use --profile "Default"` for navigation + screenshot, verifies the captured PNG is not a login page (size + text heuristic), exits 0 on success or non-zero with `AUTH_EXPIRED` on stderr if logged out
-- Add `scripts/sim-capture-bridge.ts` — reads stdin line-by-line, passes through unchanged to its own stdout, parses lines that match `{"event":"CAPTURE_TRIGGER",...}`, spawns the capture script for each, halts the pipe on capture failure
-- Add `bun run sim:preflight` script — checks: 18 sim agents registered, 12 memory stores provisioned, `console.anthropic.com` reachable via `browser-use`, and the sim scripts compile under `bun run`
-- Add `bun run sim:emit-manifest` script — at end of sim, walks `assets/memory-stores-screenshots/` and writes `manifest.json` consolidating the 6 PNG paths and per-week sizes
-
-**Accept:**
-
-- `bun run sim:preflight` returns 0 against a fully-provisioned environment
-- A 1-week dry run (force `CAPTURE_TRIGGER` at week 1) writes a real authenticated Anthropic Console screenshot to `assets/memory-stores-screenshots/lp/week-1.png` — file > 100KB, visibly contains the memory stores list page (not a login screen)
-- An auth-expired dry run (intentionally signed out of Console) makes the capture script exit non-zero with `AUTH_EXPIRED` on stderr, and the bridge halts the pipe rather than silently continuing
-- Trigger protocol JSON format exactly matches `prompts/sim-runner.md` "Trigger protocol" section
-
-## T12 — `webster-onboarding` v2 skill + verify-all script
-
-**Depends on**: T1 (memory provisioning script), T2 (production agent specs already registered)
-**Blocks**: case-study video recording
-
-Rewrite the onboarding skill from the b3fd05f baseline to fit the v2 phase model and v2 stack. Build the rollup verify script the skill drives at P3/P4 gates.
-
-**Code:**
-
-- `skills/webster-onboarding/SKILL.md` — phase model (P0–P5), status file at `context/onboarding-status.json`, dynamic Q&A in P1, key-safety disclaimer at P2, machine-checked gates at each phase boundary, resume-from-status-file at startup. Full spec in `context/ONBOARDING-CASE-STUDY.md` "Skill design — webster-onboarding v2"
-- `scripts/onboarding/verify-env.ts` — reads `.env.local`, hits each provider's verify endpoint, returns ok/fail without echoing key values
-- `scripts/onboarding/verify-all.ts` — runs all P3 + P4 checks (env + repo + memory stores + agents) as a single rollup; supports `--phase {p3,p4}` flag
-- `scripts/onboarding/scaffold-repo.ts` — creates a fresh GitHub repo under the user's account, scaffolds an Astro starter using brand identity from `context/business.yaml`
-
-**Accept:**
-
-- `bun run onboarding:verify-all` exits 0 only when all of: `.env.local` has the 3 keys verified live, target GitHub repo is reachable via the user's PAT, `GET /v1/agents` returns ≥9 production agents, `GET /v1/memory_stores` returns ≥6 stores
-- Skill, run twice on a fresh environment, produces identical state (idempotent)
-- A test run on a clean environment, with all gates failing intentionally, reports the specific failing check + remediation hint, persists the status file, and resumes correctly when re-run after fixes
-- No key values appear in stdout, stderr, or any committed file at any point
-
-## T13 — Empire Asphalt Paving substrate prep
-
-**Depends on**: dad consent (logged at `assets/onboarding-case-study/dad-consent.txt`)
-**Blocks**: case-study video recording
-
-Hand-craft the ugly v0 of dad's site, fill the brand corpus, and create a fresh GitHub repo for the case study install to land into.
-
-**Code + assets:**
-
-- `context/brand-corpus/` populated with: logo.png, business-card.jpg, past-jobs/{1..3}.jpg, service-list.md, reviews.md, voice-notes.md (full spec in `context/ONBOARDING-CASE-STUDY.md` "Brand corpus")
-- Fresh GitHub repo `richsak/empire-paving-demo` (private) containing a hand-crafted ugly v0 — single Astro page with the brand colors (`#1B47A1` royal blue, `#F9D71C` yellow), bad layout, missing trust signals, no responsive breakpoints. Acceptable to piggyback on T4's ugly-site fork script if it generalizes cleanly.
-- `assets/onboarding-case-study/dad-consent.txt` — one-line acknowledgment confirming dad has agreed to use of business name, logo, and paraphrased quotes in the submission video. Do not commit a PII-heavy version.
-
-**Accept:**
-
-- `gh repo clone richsak/empire-paving-demo` succeeds and the cloned site builds (`bun run build`) without errors
-- The ugly v0 visibly uses the Empire palette and identity (not generic gray)
-- Dad consent artifact exists in `assets/onboarding-case-study/`
-- Brand corpus directory contains all 6 corpus categories, with at least placeholder contents for any items dad doesn't have real assets for (e.g. reviews paraphrased from real reviews if Google reviews are sparse)
diff --git a/context/ONBOARDING-CASE-STUDY.md b/context/ONBOARDING-CASE-STUDY.md
index e0c4654..97be371 100644
--- a/context/ONBOARDING-CASE-STUDY.md
+++ b/context/ONBOARDING-CASE-STUDY.md
@@ -23,7 +23,7 @@ This is **not** a role-play. Richie narrates from the operator/builder perspecti
 | Q1   | asset = case study video, not role-play                                                                                  | dad's domain is real, dad's quote is real (paraphrased), Richie remains himself |
 | Q2   | persona dissolved — Richie is Richie, dad is the user                                                                    | no character swap                                                               |
 | Q3   | skill v2 = thin shell + scripts                                                                                          | matches Layer 4 architecture; UX layer over orchestration                       |
-| Q4   | skill provisions full v2 stack: 9 agents + 6 memory stores + first council                                               | matches video marquee feature                                                   |
+| Q4   | skill provisions full v2 stack: 10 production agents + 6 memory stores + first council                                   | matches video marquee feature                                                   |
 | Q5   | skill = brand context + infra wiring only; site code is upstream                                                         | Claude Design zip → Astro is a separate future skill                            |
 | Q6   | substrate = Empire Asphalt Paving (`empireasphalt.ca` parked, repo modern but undeployed)                                | strongest narrative — "domain owned, no real site, Webster built it"            |
 | Q7   | context capture has 3 sources: URL scrape, file uploads, dynamic Q&A                                                     | fills brand memory from whatever surfaces exist                                 |
@@ -51,7 +51,7 @@ This is **not** a role-play. Richie narrates from the operator/builder perspecti
 | 8–33s  | P1 Context capture | drag `logo.png`, `business-card.jpg`, `past-jobs/`, `voice-notes.md` into chat; skill auto-asks 2–3 dynamic gap-fills (voice register, do-not-use list, target customer)         | Richie VO paraphrasing dad: _"Eighteen years paving. Family business. Premium handcraft, not the cheap-truck guys."_                                                                          |
 | 33–41s | P2 Prep checklist  | checklist appears in chat: Anthropic key, GitHub access, Cloudflare token                                                                                                        | VO: _"Three keys. He pastes them on his own machine. The skill never sees them."_                                                                                                             |
 | 41–56s | P3 Execute         | user pastes keys locally (off-screen disclaimer overlay: _"Keys never typed in chat — pasted into `.env.local` on dad's machine"_); GitHub repo scaffolded; `.env.local` appears | VO: _"Skill writes nothing it can't see. Keys stay local."_                                                                                                                                   |
-| 56–68s | P4 Verify          | green checks roll in: env ✓ / repo ✓ / 6 memory stores provisioned ✓ / 9 agents registered ✓                                                                                     | VO: _"Six memory stores. Nine agents. Wired in seconds."_ (deliberately vague — actual install time will be measured at recording and the pacing edited to match what the visuals show)       |
+| 56–68s | P4 Verify          | green checks roll in: env ✓ / repo ✓ / 6 memory stores provisioned ✓ / 10 production agents registered ✓                                                                         | VO: _"Six memory stores. Ten agents. Wired in seconds."_ (deliberately vague — actual install time will be measured at recording and the pacing edited to match what the visuals show)        |
 | 68–90s | P5 First council   | session ID flashes; PR URL surfaces; week-1 redesign of dad's site appears in browser tab; cut to Webster wordmark                                                               | VO: _"First council fires. Reads his brand. Proposes week-one redesign. Dad reviews. Merges if he likes it."_ + paraphrased dad quote: _"He told me, 'I don't even need to think about it.'"_ |
 
 **Hard length**: 90s. **Floor**: 60s collapse via the drop priority below.
@@ -127,14 +127,14 @@ P5 First council — trigger session, surface PR URL, end
 
 ### Phase exit gates (machine-checked)
 
-| phase | gate        | check                                                                                                                                           |
-| ----- | ----------- | ----------------------------------------------------------------------------------------------------------------------------------------------- |
-| P0    | soft        | user typed "ready"                                                                                                                              |
-| P1    | hard        | `context/business.yaml` exists + ≥1 source signal recorded                                                                                      |
-| P2    | hard        | checklist all `[x]`                                                                                                                             |
-| P3    | hard rollup | `bun run onboarding:verify-all` green: `.env.local` exists + `gh repo view` ok + `GET /v1/agents` returns 9 + `GET /v1/memory_stores` returns 6 |
-| P4    | hard        | same rollup re-runs green                                                                                                                       |
-| P5    | hard        | session_id returned + PR URL surfaced                                                                                                           |
+| phase | gate        | check                                                                                                                                                                                                          |
+| ----- | ----------- | -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| P0    | soft        | user typed "ready"                                                                                                                                                                                             |
+| P1    | hard        | `context/business.yaml` exists + ≥1 source signal recorded                                                                                                                                                     |
+| P2    | hard        | checklist all `[x]`                                                                                                                                                                                            |
+| P3    | hard rollup | `bun run onboarding:verify-all` green: `.env.local` exists + `gh repo view` ok + `GET /v1/agents` returns the count of production specs in `agents/*.json` (currently 10) + `GET /v1/memory_stores` returns ≥6 |
+| P4    | hard        | same rollup re-runs green                                                                                                                                                                                      |
+| P5    | hard        | session_id returned + PR URL surfaced                                                                                                                                                                          |
 
 Gate failure → show the specific check that failed + remediation hint + halt with status file preserved. User fixes, re-runs skill, resume from same phase.
 
diff --git a/context/ROADMAP.md b/context/ROADMAP.md
deleted file mode 100644
index 8ba1823..0000000
--- a/context/ROADMAP.md
+++ /dev/null
@@ -1,192 +0,0 @@
-# Webster Roadmap — the map
-
-> Single source of truth for "where am I, what's next, what did I sign up for."
-> Read top-to-bottom when lost. Regenerate from `context/FEATURES.md` if it drifts.
-
-## The one-paragraph map
-
-Webster is a **Council of Claude Managed Agents** that autonomously redesigns a small-business landing page, week after week, with **Opus 4.7 spawning new critics at runtime** when it spots patterns existing critics miss. The novel mechanic is **Critic Genealogy** — agents creating agents. The hackathon submission for Anthropic × Cerebral Valley "Built with Opus 4.7" is due **Sunday April 26 2026, 8PM EST** (~70h from now). Target prize lanes: Managed Agents $5K (62-72/100) + Creative Exploration $5K (48-58/100) + Grand $50K (18-25/100).
-
-## North-star invariant
-
-**Validate before human approval.** Every change passes the full validation stack — static critics → runtime gate → visual reviewer → autoresearch verdict — before it reaches a PR in Richie's inbox. Human is the last ratchet, not the first debugger. If a feature doesn't connect to this principle, it's out of scope.
-
-## Where we are right now (2026-04-23)
-
-- **Branch**: `main`, 5 commits ahead of `origin/main` (push-blocked by permission policy — Richie's action)
-- **Submission runway**: ~70 hours to deadline
-- **Shipped**: Layers 1–4 + 7 — 24 features in ~12 hours of focus-work
-- **In-progress**: 1 (Layer 1 live-artifact pattern)
-- **Blocked**: Layer 6 video (5 features, Richie voice record)
-- **Open loops**: 3 deadline-critical + 4 scope-expansion layers (see below)
-- **Full submission scope** (updated): Layers 1–11 — everything ships before 4/26
-
-## Timeline correction (my estimation bias)
-
-My earlier estimates assumed calendar-hours. Actual tempo: **24 features in 12 hours** with Forge + Pi workers dispatched in parallel. The remaining 4 layers (L8 + L9 + L10 + L11) total ~55 focus-hours of feature work, which at your tempo compresses to ~18–25h of your wall time. Fits in 70h runway with room for the video, form, and a voice-surgery polish pass.
-
-Operating assumption from here forward: **every feature you name is in pre-submission scope unless you explicitly say otherwise.**
-
-## Layer-by-layer truth
-
-| Layer | Theme                                      | Status                                 | Features                                 |
-| ----- | ------------------------------------------ | -------------------------------------- | ---------------------------------------- |
-| L1    | Routine + Orchestrator                     | shipped                                | #2–#4, #6 done; #1 cut; #5 in-progress   |
-| L2    | 7 Managed Agent Critics                    | shipped                                | #7–#12 done                              |
-| L3    | **Critic Genealogy (HERO)**                | shipped, live-validated                | #13–#17 done                             |
-| L4    | Onboarding Skill                           | shipped                                | #18, #19, #23, #24 done; #20–#22 cut     |
-| L5    | Substrate + Mock History                   | core shipped                           | #27 done; #25, #26, #28 cut              |
-| L6    | Meta Video                                 | blocked                                | #29–#33 waiting on voice record          |
-| L7    | Polish                                     | mostly shipped                         | #34–#36 done; #37 todo (Richie action)   |
-| L8    | **v2: Apply worker, text-only**            | planned — ships FIRST                  | #38 done; #39a–e, #40a–d todo            |
-| L10   | **v2.5: Designer scope expansion**         | planned — ships SECOND                 | #47–#49 todo (kind+constraints+verifier) |
-| L9    | **v3: Visual review + Autoresearch**       | planned — ships THIRD (0bb9db2)        | #41a–d, #42–#46 todo                     |
-| L11   | **v4: Planner + experiment-aware council** | planned — ships LAST (closes the loop) | #50–#53 todo (NEW this session)          |
-
-## What's new THIS session (session 4)
-
-- `61cfae4` — `site/before/` + `site/after/` forked from live `certified.richerhealth.ca`; 5-issue proposal applied by hand to `after/`
-- `475e129` — `context/v2-design.md` grill-me answers; Layer 8 decomposed into #39a-e + #40a-d
-- `a1cb0e5` — advisor-caught regression fix: "No more patient churn" restored in Issue 4 hero
-- `0bb9db2` — Layer 9 added (9 sub-features: visual-reviewer chain + autoresearch chain) + 6 hero screenshots as motivating evidence
-- `f34858d` — `context/ROADMAP.md` — single source of truth for roadmap + narrative
-- **PENDING (this phase)**: `context/DOMAIN-MODEL.md` (NEW) + Layer 10 + Layer 11 added to FEATURES.md
-
-All commits local-only. Push permission policy blocks direct push to main; Richie-action item.
-
-## Architectural shift locked this session
-
-Autoresearch is NOT a back-end post-merge feedback loop. It's the **input** to the next council run. A **planning agent** sits before the 5 critics + redesigner, reads last week's verdict + what-changed, decides experiment direction for this week, then the council runs with `plan.md` as context.
-
-This is the shift from **autonomous weekly redesigner** → **autonomous experiment agent**. See `context/DOMAIN-MODEL.md` for the formal model + week lifecycle + grill-me questions on the 7 remaining architectural decisions.
-
-## Deadline-critical loops for 4/26
-
-**Human-only actions** (no Claude can do these):
-
-1. **Cerebral Valley submission form** (#37; ~15 min; Richie-only)
-2. **Demo video voice record** (Layer 6 blocker; ~1h record + Saturday assembly)
-3. **Push local commits to origin/main** (1-min terminal action, required before submission)
-
-**Scope-expansion layers that ALSO ship pre-submission** (Claude+worker parallelizable):
-
-- **Layer 8** — apply worker text-only (~18h feature work)
-- **Layer 10** — designer scope expansion (~7h feature work)
-- **Layer 9** — visual review + autoresearch measurement (~18h feature work)
-- **Layer 11** — planner agent + experiment-aware council (~12h feature work, NEW)
-
-Ordering: human-only actions 1–3 can happen anytime; the four scope-expansion layers ship in dependency order (L8 → L10 → L9 → L11). Grill-me on DOMAIN-MODEL.md open questions unblocks L11 implementation.
-
-## Pre-submission roadmap — L8 → L10 → L9 → L11 (dependency order)
-
-All four layers exist to make Webster **genuinely autonomous**, not just autonomously-change-producing. Build order matters:
-
-### L8 (v2) — Apply worker, text-only | ~18h total
-
-**Why it exists**: today the council emits `proposal.md`. No code changes. L8 turns proposal into PR diffs. Text-level only — council says "change X to Y", apply runs find-replace, runs lint/type/format, emits a PR.
-
-| #      | Feature                                                                   | Hours |
-| ------ | ------------------------------------------------------------------------- | ----- |
-| #38    | site/ fork — DONE session 4                                               | ✅    |
-| #39a   | Apply worker core (Pi worker via Forge, worktree-isolated)                | 4–6   |
-| #39b   | Runtime validation gate (Playwright: CTAs resolve, no JS errors)          | 2–3   |
-| #39c   | Critic re-run gate (0 new CRITICAL, ≤2 new HIGH; 3-iter fix loop)         | 2     |
-| #39d   | Per-cluster PR emission (1–3 issues/PR, max 3 PRs/week)                   | 3     |
-| #39e   | CF Pages preview URL wiring                                               | 1–2   |
-| #40a–d | Image-gen tool (tool schema, backend, brand persistence, #39 integration) | 7     |
-
-**Testable when**: `wbs @prompts/fifth-wbs-session.md` produces a PR with real code diffs, not just `proposal.md`.
-
-### L10 (v2.5) — Designer scope expansion | ~7h total
-
-**Why it exists**: session-4 proved text-only proposals aren't enough. Longer copy needs smaller font-size to keep hero rhythm. Without L10, the council is a **copy-editor council**, not a **design council**. L10 lets the designer propose CSS/layout/component changes as first-class issues.
-
-| #   | Feature                                                                               | Hours |
-| --- | ------------------------------------------------------------------------------------- | ----- |
-| #47 | Proposal schema v2 (kind-aware: text/css/component/asset + constraints block)         | 2     |
-| #48 | Apply worker multi-kind routing (tool per kind)                                       | 3     |
-| #49 | Visual-reviewer constraint verifier (asserts declared constraints in rendered output) | 2     |
-
-**Testable when**: council proposes "shorter subhead + 0.75× hero font-size + 3-line desktop H1 constraint" as ONE atomic issue; apply worker executes all three together; visual-reviewer confirms constraint met.
-
-### L9 (v3) — Visual review + Autoresearch | ~18h total
-
-**Why it exists**: L8 and L10 ship changes. L9 **verifies they work**. Two halves:
-
-**Visual reviewer** (runs immediately post-apply, pre-PR):
-
-| #    | Feature                                                                                             | Hours |
-| ---- | --------------------------------------------------------------------------------------------------- | ----- |
-| #41a | `agents/webster-visual-reviewer.json` spec (Opus 4.7)                                               | 1     |
-| #41b | `skills/webster-browser-audit/SKILL.md` (Playwright screenshot + a11y tree + interaction recording) | 3     |
-| #41c | Proposal-intent verifier (content presence + overflow detection)                                    | 2     |
-| #41d | #39 integration (3-iteration fix-hint loop back to apply worker)                                    | 1     |
-
-**Autoresearch** (runs post-merge, week+ cycles):
-
-| #   | Feature                                                                               | Hours |
-| --- | ------------------------------------------------------------------------------------- | ----- |
-| #42 | Analytics ingestion (CF Worker pixel → D1 or PostHog/GA4 webhook)                     | 3     |
-| #43 | Baseline tracker + change log                                                         | 2     |
-| #44 | Verdict engine (proxy-first fast signal + CVR slow confirm; asymmetric rollback gate) | 3     |
-| #45 | Auto-rollback worker (git revert → CF preview → draft PR for override)                | 2     |
-| #46 | Baseline promoter (2-week sustained improvement → new baseline)                       | 1     |
-
-**Testable when**: visual-reviewer blocks a known-bad session-4-style regression; autoresearch rolls back a week that hurts proxy metrics; baseline promoter advances after 2 good weeks.
-
-### L11 (v4) — Planner + experiment-aware council | ~12h total | NEW
-
-**Why it exists**: L9 measures last week's experiment. But measurement without decision is half a loop. L11 adds a **planning agent** that sits BEFORE the 5 critics + redesigner, reads last week's verdict + what-changed, decides direction for this week (promote / hold / rollback), and feeds `plan.md` as context to the council run. Closes the autonomy loop — Webster becomes an **experiment agent**, not a weekly redesigner.
-
-| #   | Feature                                                                                                           | Hours |
-| --- | ----------------------------------------------------------------------------------------------------------------- | ----- |
-| #50 | `agents/webster-planner.json` (Opus 4.7) — reads verdict + what-changed, decides next-experiment direction        | 2     |
-| #51 | Verdict → plan pipeline — orchestrator invokes planner with verdict.json + proposal.md + apply-log + monitor data | 3     |
-| #52 | Plan → council integration — critics + redesigner read plan.md as input context                                   | 3     |
-| #53 | Cold-start behavior — week 1 with no prev verdict; planner outputs "explore broadly" default plan                 | 2     |
-
-**Testable when**: week N+1 council run reads week N verdict automatically; planner outputs plan.md before critics spawn; critics + redesigner have plan.md in context; end-to-end cycle (propose → apply → review → merge → measure → verdict → plan → propose) runs in simulator without human touch between measure and plan.
-
-**Grill-me questions blocking L11**: 7 open decisions listed in `context/DOMAIN-MODEL.md`. Richie answers → implementation unblocks.
-
-## Decisions waiting on you
-
-Ranked by blast radius:
-
-1. **Push path for 5 local commits** — direct push to main, OR PR branch? (blocks submission)
-2. **Cerebral Valley submission form** (#37) — Richie-only 15-min task
-3. **Voice record scheduling** — Sat AM? blocks Layer 6 video (~3h cleanup after)
-4. **L11 grill-me answers** — 7 open questions in `context/DOMAIN-MODEL.md` unblock planner implementation
-5. **Session-4 hero voice-surgery** — revert copy to BEFORE wording (85/100), or trim line 3 (75/100), or keep as cautionary-tale artifact (45/100)? My pick: option 1 after v2 apply worker lands, as the first-ever apply-worker PR demo
-6. **`[R-confirm]` in `context/v2-design.md`** (3 items): visual-regression cost threshold, `gpt-image-1` as image backend default, PR `summary.json` alongside markdown
-
-## Three things to hold in your head
-
-Everything else is noise until these land:
-
-1. **Submit by 4/26** — form + video + push origin (human-only actions)
-2. **Answer L11 grill-me** — 7 questions in `context/DOMAIN-MODEL.md` unblock the planner agent and the full-cycle autonomous claim
-3. **Kick off L8 #39a** — apply worker core. First real PR with mutated code. Everything downstream (L10 → L9 → L11) layers on top
-
-The rest exists. Those three are the **bottleneck path**. Full submission scope is now all 11 layers — ~18–25h wall time at your tempo, fits in 70h runway.
-
-## How this doc relates to the rest
-
-- `context/FEATURES.md` — canonical per-row status. This doc quotes it; FEATURES.md is authoritative for "what's `todo` vs `done`."
-- `context/ARCHITECTURE.md` — system diagram + layer breakdown. This doc is the narrative overlay.
-- `context/v2-design.md` — grill-me answers + rationale for Layer 8 decomposition. This doc summarizes; v2-design.md is the detailed record.
-- `~/Vault/Projects/webster/Webster.md` — cross-session hub + pitch.
-- `~/Vault/Projects/webster/webster-open-loops.md` — action queue (vault-scoped, broader than this doc's 3 open loops).
-
-## How to use this doc
-
-- **Lost** → read top to bottom in 5 min
-- **Before a session** → skim "what's new this session" + "three things to hold in your head"
-- **After a decision** → update "decisions waiting on you" or ask me to
-- **On a pull request** → cross-check "Layer-by-layer truth" table
-
-This doc is the truth-source for roadmap questions. If `context/FEATURES.md` contradicts this about per-row state, FEATURES.md wins. If anything contradicts this about layer-narrative or ordering, this wins.
-
----
-
-Last regenerated: 2026-04-23 (session 4 Phase 5, after Layer 9 commit + Layer 10 proposal).
diff --git a/context/SITE-FORK-CHECKLIST.md b/context/SITE-FORK-CHECKLIST.md
deleted file mode 100644
index 964bb08..0000000
--- a/context/SITE-FORK-CHECKLIST.md
+++ /dev/null
@@ -1,94 +0,0 @@
-# site/ Fork Checklist
-
-Run this the moment `site/` is forked from `certified.richerhealth.ca`. Everything here is a one-shot onboarding for the submitted code's own quality gates. Root-level webster gates (JSON schemas, findings validator, markdownlint) already run against the repo and will continue to; this page covers what to add _inside_ `site/`.
-
-## Build surface
-
-- `site/package.json` exists with Astro scripts
-- `site/bun.lock` committed
-- `bun install --frozen-lockfile` in `site/` succeeds on CI
-- `bun run build` in `site/` succeeds (will flip on the `site-build` job in `.github/workflows/test.yml`)
-
-## site/ toolchain to install
-
-```bash
-cd site
-bun add -D @astrojs/check astro-eslint-parser eslint-plugin-astro prettier-plugin-astro
-```
-
-## site/eslint.config.js
-
-```js
-import js from "@eslint/js";
-import tseslint from "typescript-eslint";
-import astro from "eslint-plugin-astro";
-
-export default tseslint.config(
-  { ignores: ["dist", ".astro", "node_modules"] },
-  js.configs.recommended,
-  ...tseslint.configs.strict,
-  ...astro.configs.recommended,
-);
-```
-
-## site/.prettierrc (inherits from root)
-
-```json
-{ "plugins": ["prettier-plugin-astro"] }
-```
-
-## site/package.json scripts
-
-```json
-{
-  "scripts": {
-    "dev": "astro dev",
-    "build": "astro check && astro build",
-    "preview": "astro preview",
-    "lint": "eslint . --cache --max-warnings 0",
-    "format:check": "prettier --check .",
-    "type-check": "astro check"
-  }
-}
-```
-
-## Root workflow flips
-
-Once `site/package.json` exists, the `site-build` job in `.github/workflows/test.yml` starts running. Additions to make at the same time:
-
-- Add `site-lint` job running `bun run lint --max-warnings 0` in `site/`
-- Add `site-format` job running `bun run format:check` in `site/`
-- Remove `continue-on-error` from any remaining site-build steps once it's stable
-
-## Pre-commit hook bump
-
-When `site/` lands, append to `.husky/pre-commit`:
-
-```sh
-if [ -d site ]; then
-  (cd site && bun run lint --max-warnings 0 && bun run format:check) || exit 1
-fi
-```
-
-## Playwright (Day 5 polish, optional)
-
-If time holds after core fan-out + redesigner works:
-
-```bash
-cd site
-bun add -D @playwright/test
-bunx playwright install chromium
-```
-
-One smoke test confirming the redesigned LP renders and the Acuity booking CTA is present at `site/tests/hero.spec.ts`. Run in CI matrix against Cloudflare preview URLs.
-
-## Do NOT add preemptively
-
-These buy nothing until `site/` exists, and installing them now balloons the root `node_modules`:
-
-- `astro` / `@astrojs/cloudflare`
-- `eslint-plugin-astro` / `astro-eslint-parser`
-- `prettier-plugin-astro`
-- `@playwright/test`
-
-They go in `site/package.json` when `site/` lands.
diff --git a/context/VIDEO-PLAN-90s.md b/context/VIDEO-PLAN-90s.md
deleted file mode 100644
index 1735ee0..0000000
--- a/context/VIDEO-PLAN-90s.md
+++ /dev/null
@@ -1,189 +0,0 @@
-# Demo Video Plan — 90-second cut (genealogy spine)
-
-> Active spec for the 2026-04-26 hackathon submission. Supersedes `context/VIDEO-PLAN.md` for this submission. The 180s plan in `VIDEO-PLAN.md` is preserved as historical artifact for any post-submission re-cut.
-
-## Why 90s, not 180s
-
-Submission deadline is 2026-04-26 (one calendar day from 2026-04-25). Nicolette interview window is post-deadline, so Beat 1 of the original 180s plan is unavailable. Without Beat 1 the 180s arc loses its emotional opener. Recasting around the genealogy moment — the only capability that strictly requires Opus 4.7 reasoning — produces a tighter, harder-hitting submission than a degraded 3-min cut.
-
-## Hard constraints
-
-- **Deadline**: 2026-04-26
-- **Length target**: 90s (acceptable floor: 80s)
-- **Voice**: Richie records; no AI voice; no Nicolette clip
-- **Composition stack**: Forge Remotion (per locked decision in `VIDEO-PLAN.md`)
-- **Real artifacts only**: every on-screen artifact is a real file path / commit / agent name from the Webster repo. No fabrication.
-- **Spine**: runtime agent genealogy — Webster spawned `visual-design-critic` in the live `history/2026-04-23/` council run
-
-## 5-beat structure
-
-| #   | Beat       | Time      | Spoken (~) | Hero visual                                                               | Asset source                                                |
-| --- | ---------- | --------- | ---------- | ------------------------------------------------------------------------- | ----------------------------------------------------------- |
-| 1   | Hook       | 0:00–0:10 | 17 words   | Black → "Webster" text card → council diagram zoom                        | Forge-Remotion-authored title card                          |
-| 2   | Setup      | 0:10–0:25 | 29 words   | 7-node council fan-out animation                                          | Forge Remotion comp from `agents/*.json` registry           |
-| 3   | The Moment | 0:25–0:55 | 61 words   | Cursor scrolling `spec.json` → terminal `POST /v1/agents` → first finding | `history/2026-04-23/genealogy/spec.json` + screen recording |
-| 4   | Receipt    | 0:55–1:15 | 35 words   | Genealogy log on screen → before/after LP morph                           | `history/2026-04-23/genealogy/` + sim `final-sheet.png`     |
-| 5   | Frame      | 1:15–1:30 | 27 words   | Feature grid page scroll → end card                                       | `assets/feature-grid/index.html` (Tier 3 item #1 output)    |
-
-Total spoken: ~169 words at ~130 wpm = ~78s. Buffer: 12s of silence/visual breathing, distributed unevenly (most at end of Beat 3 and Beat 5).
-
-## VO recording script (Richie reads top to bottom)
-
-Read at ~130 wpm. Record per-line takes; 3-5 takes minimum per line. Pauses between sentences are fine — they get cut at edit. Save raw takes to `assets/voiceover/raw/<beat>-<line>.wav` (or `.mp3`). External mic only — laptop mic kills credibility.
-
-### Beat 1 — Hook (~7s spoken)
-
-**Take 1** (declarative, intimate, set the tone for the whole video):
-
-> "I taught a website to improve itself."
-
-**Take 2** (matter-of-fact, slightly faster):
-
-> "Every week, a council of Claude agents debates it."
-
-### Beat 2 — Setup (~12s spoken)
-
-**Take 1** (factual, clipped):
-
-> "Seven Managed Agents — five critics, a planner, a redesigner."
-
-**Take 2** (slightly slower, give "audit" weight):
-
-> "Each owns one slice of the audit."
-
-**Take 3** (three-beat rhythm, slight pause between):
-
-> "They propose. Apply. Verify."
-
-### Beat 3 — The Moment (~26s spoken — the hero beat)
-
-Slow ~10% on this beat. The phrase "they wrote a new agent" is the emotional pivot — let it breathe.
-
-**Take 1** (date-stamp opener, factual):
-
-> "April twenty-third — they hit a problem nothing could solve."
-
-**Take 2** (recite the three categories with slight pauses between, mirroring the visual cut):
-
-> "Three critics flagged the same kind of issue. Hero imagery. Layout rhythm. Visual hierarchy."
-
-**Take 3** (declarative, slight resignation in tone):
-
-> "All three said it was outside their scope."
-
-**Take 4** (the punchline — slow down, lean in):
-
-> "So they wrote a new agent. With code. From scratch."
-
-### Beat 4 — Receipt (~16s spoken)
-
-**Take 1** (clipped, technical, receipts-energy):
-
-> "Visual-design-critic. Sonnet four-point-six."
-
-**Take 2** (factual, even):
-
-> "Registered through the Managed Agents API. Same session."
-
-**Take 3** (declarative, slight pride):
-
-> "Six critics now. Append-only. Every spawn auditable."
-
-**Take 4** (warmth — the only soft moment in the video, slow it down):
-
-> "Like growing a new sense."
-
-### Beat 5 — Frame (~12s spoken)
-
-**Take 1** (bookend energy, mirrors Beat 1 opener):
-
-> "A website that improves itself."
-
-**Take 2** (declarative, hackathon claim — slight smile in voice):
-
-> "Built with Opus four-point-seven."
-
-**Take 3** (read the URL in natural English: "github" + "dot com" as words, not letters):
-
-> "Receipts at github dot com slash richsak slash webster."
-
-## Recording order recommendation
-
-Record in this order to warm up your voice:
-
-1. **Beat 4 takes** (technical, low stakes, easy warm-up)
-2. **Beat 5 takes** (3 short lines, closer energy)
-3. **Beat 2 takes** (mid-stakes, three-beat rhythm)
-4. **Beat 1 takes** (set the tone — your voice should be warm here, not stiff)
-5. **Beat 3 takes** (highest stakes — save your best vocal energy for the hero beat, do these last when you're warmest)
-
-Total session length target: 30-45 min including retakes.
-
-## Anti-goals
-
-- Don't try to "sound like a podcast voiceover." That's the AI-slop voice. Sound like you.
-- Don't rush Beat 3 punchlines. "From scratch." needs air around it.
-- Don't add words. Read the locked script verbatim. Tone variation only.
-- Don't pronounce "github.com" as "github-dot-com." Read "dot com" as natural words.
-- Don't go up at the end of Beat 5. Land flat.
-- Don't try one continuous take. Per-line takes give the editor (or composition session) room.
-
-## Forge Remotion composition handoff brief
-
-The video composition session reads this doc and assembles in Forge Remotion. Order:
-
-### 1. Asset readiness check (composition session blocks until all green)
-
-- [ ] `assets/voiceover/raw/` populated with per-line takes per the 5-beat script above
-- [ ] `history/2026-04-23/genealogy/spec.json` — exists (verified 2026-04-25)
-- [ ] `history/2026-04-23/genealogy/rationale.md` — exists (verified 2026-04-25)
-- [ ] `demo-output/lp/week-{1,10}/screenshots/1440/index.png` — for Beat 4 before/after morph (T8 sim run output)
-- [ ] `assets/feature-grid/index.html` — for Beat 5 scroll (Tier 3 item #1 output)
-- [ ] Council fan-out diagram source — Forge Remotion authors from scratch using `agents/*.json` names
-
-### 2. Composition phases
-
-1. **Beat 1**: Title card (Forge Remotion text comp). Black → white "Webster" lockup → quick scale-zoom into council diagram (transition into Beat 2). VO Take 1 + Take 2 layered.
-2. **Beat 2**: Council fan-out animation. 7 nodes appearing in sequence (planner → 5 critics → redesigner). Use real agent names from `agents/*.json` as node labels. VO Takes 1-3 layered with the node-appearance choreography.
-3. **Beat 3**: Cursor-scrolling-`spec.json` screen recording → cut to terminal showing `POST /v1/agents` (mocked from real session record at `history/2026-04-23/genealogy/session.json`) → cut to first finding rendering. VO Takes 1-4 layered with cuts. SFX stinger optional on "they wrote a new agent."
-4. **Beat 4**: Genealogy folder structure on screen (real `history/2026-04-23/genealogy/` listing) → before/after morph of Richer Health LP at week 1 vs week 10 (sim outputs). VO Takes 1-4 layered. Soften visual energy for Take 4 ("Like growing a new sense").
-5. **Beat 5**: Quick scroll-through of `assets/feature-grid/index.html` → end card with "Built with Opus 4.7" lockup + GitHub URL + small QR code linking to repo. VO Takes 1-3 layered.
-
-### 3. Length check
-
-- Target: 90s. Floor: 80s.
-- If overshoot: trim Beat 2 first (drop "They propose. Apply. Verify." — saves ~3s) → trim Beat 4 by removing "Append-only. Every spawn auditable." (saves ~3s) → only trim Beat 3 if absolutely required.
-- If undershoot: do NOT pad. Submit short.
-
-### 4. Output format
-
-- 1080p MP4
-- Confirm Cerebral Valley submission format requirements before bake.
-
-### 5. Pre-submission gates
-
-- Verify Beat 3 narration matches what actually spawned: `visual-design-critic` (NOT visual-reviewer or visual-critic — exact name from `history/2026-04-23/genealogy/spec.json`)
-- Verify Beat 2 agent count matches reality at the time of the demonstrated council run (5 critics + planner + redesigner = 7, before the spawn)
-- Verify Beat 4 post-spawn count: 6 critics
-- Watch end-to-end at least once on a phone (most judges watch on phones)
-
-### 6. Submit
-
-- Cerebral Valley form
-- GitHub repo link
-- DM if relevant
-
-## Open dependencies before composition can run
-
-| Asset                                                | Status                          | Owner                  | Blocks       |
-| ---------------------------------------------------- | ------------------------------- | ---------------------- | ------------ |
-| Voiceover takes                                      | not recorded                    | Richie                 | Beats 1-5    |
-| Sim outputs (`demo-output/lp/week-{1,10}/`)          | not run                         | T0-T13 finishing track | Beat 4 morph |
-| Feature grid HTML (`assets/feature-grid/index.html`) | not built                       | Tier 3 item #1 session | Beat 5       |
-| Genealogy artifacts                                  | available (verified 2026-04-25) | n/a                    | n/a          |
-
-## When in doubt
-
-- Tone questions: read the existing VO script in `VIDEO-PLAN.md` for register reference (warm, first-person, conversational; not declamatory).
-- Asset ambiguity: surface `[STUCK]` to Richie. Do not silently improvise.
-- Anything else: the spine is genealogy. If a composition decision pulls focus away from the genealogy moment (Beat 3), reject it.
diff --git a/context/VIDEO-PLAN.md b/context/VIDEO-PLAN.md
deleted file mode 100644
index 3a3c28f..0000000
--- a/context/VIDEO-PLAN.md
+++ /dev/null
@@ -1,665 +0,0 @@
-# Demo Video Plan — Webster Hackathon
-
-> **SUPERSEDED for the 2026-04-26 submission cut.** See `context/VIDEO-PLAN-90s.md` for the active 90-second genealogy-spine spec. This doc is preserved as historical artifact (180s 6-beat plan with Nicolette clip in Beat 1) for any post-submission re-cut.
-> Session-durable working doc. Evolves across compactions. If resuming mid-session, read this first, then `VISION.md`.
-
-## Session purpose
-
-Grill through the 6-beat demo video arc until every decision is locked. Output is a shot-list / narrative spec that the video-composition session (fresh Claude Code + Forge Remotion) builds against. This is NOT the simulation implementation track (that's `EXPANSION-TASKS.md`).
-
-## Hard constraints
-
-- **Deadline**: 2026-04-28 (Built with Opus 4.7 by Anthropic × Cerebral Valley)
-- **Today**: 2026-04-24 (4 days to submission, 3 full work days)
-- **Locked scope**: `VISION.md` — two substrates, 10 weeks × 2 sims, hybrid memory, pure-organic genealogy
-- **Human-in-loop assets** (Richie records separately):
-  - Nicolette clip (A/B testing pain)
-  - Voiceover narration
-  - Onboarding skill role-play (contractor persona)
-  - Memory Stores Console screenshots
-- **Composition stack**: Claude Design (claude.ai/design, research preview, code-powered animations + UI) for diagram + artifact micro-UIs; Forge Remotion for final video composition (voiceover + Nicolette clip + Claude Design output + screenshot timelapses + transitions). Deployed via fresh session after sim assets exist.
-
-## Implementation track status (as of compaction)
-
-- T0 Pass-7 fixes: ✓ shipped
-- T1 memory stores: ✓ shipped
-- T2 sim agent specs: ✓ shipped
-- T3 substrate contexts: ✓ shipped
-- T4 ugly baselines: ✓ shipped
-- T5 Synthetic Analytics Agent: next
-- T6–T10: queued
-
-Video planning runs in parallel with T5–T10. The video-composition session happens AFTER T10 when all assets exist.
-
-## Video arc (6 beats)
-
-1. **Problem** — Nicolette clip (manual A/B testing pain)
-2. **Solution intro** — Voiceover + council UI animation
-3. **LP timelapse** — Richer Health 10-week timelapse (one veto/skip beat)
-4. **Site timelapse** — Northwest Home Renovations 10-week timelapse
-5. **Genealogy reveal** — Memory Stores Console + spawn moment
-6. **Close** — Tagline, CTA, Anthropic framing
-
-## Grill status
-
-| Beat | Budget (target/floor) | Status                              | Next action                      |
-| ---- | --------------------- | ----------------------------------- | -------------------------------- |
-| 1    | 45s / 35s             | LOCKED (talking points + drop list) | Richie sends to Nicolette        |
-| 2    | 35s / 25s             | LOCKED                              | (composition session implements) |
-| 3    | 35s / 25s             | LOCKED                              | (composition session implements) |
-| 4    | 30s / 22s             | LOCKED                              | (composition session implements) |
-| 5    | 25s / 18s             | LOCKED with fallback rules          | (composition session implements) |
-| 6    | 10s / 8s              | LOCKED                              | (composition session implements) |
-
-## Composition session brief (handoff start)
-
-This document is the locked spec. The video-composition session reads it and executes. Order:
-
-1. **Confirm asset readiness**:
-   - `demo-output/lp/week-{1..10}/` populated (screenshots at 375/768/1440, manifests, council reasoning, analytics.json)
-   - `demo-output/site/week-{1..10}/` populated
-   - Memory Stores Console screenshots captured at relative weeks (Richie)
-   - Nicolette clip recorded (Richie)
-   - Voiceover recorded per Beat 2/3/4/5/6 scripts (Richie)
-   - Real artifact bodies extracted: best critic finding (Beat 2 Window 1) + actual `POST /v1/agents` request+response (Beat 2 Window 2)
-   - If genealogy didn't spawn → see Beat 5 fallback rules; do NOT silently improvise
-
-2. **Build animated assets in Claude Design** (claude.ai/design):
-   - Beat 2: council diagram + 2 artifact windows (per Beat 2 spec, including 5 critic nodes with `xxx-critic` + role subtitles)
-   - Beat 3 + Beat 4: animated bounce-rate line chart, fed by `analytics.json` per substrate
-   - Beat 5: composite Console-styled UI with genealogy tree, week N captions, spawn animation
-   - Beat 6: final frame composition (Webster wordmark + "Built with Opus 4.7" lockup + GitHub URL + small QR)
-
-3. **Compose in Forge Remotion**:
-   - Sequence: Beat 1 (45s) → Beat 2 (35s) → Beat 3 (35s) → Beat 4 (30s) → Beat 5 (25s) → Beat 6 (10s) = 180s
-   - Embed Claude Design output via `<Html>` / `<IFrame>` or screen-recorded MP4 asset
-   - Layer voiceover audio synced to choreography tables in each beat spec
-   - Music bed under all beats except where VO carries; SFX stinger at Beat 5 spawn moment
-
-4. **Length check**:
-   - Target: 3:00 (180s). Cerebral Valley cap: confirm before bake.
-   - If overshoot: walk drop-priority lists mechanically (per beat, ordered)
-   - If undershoot: do NOT pad. Submit short.
-
-5. **Output format**: 1080p MP4. Confirm any specific Cerebral Valley submission format requirements.
-
-6. **Pre-submission gates**:
-   - Verify Beat 5 narration matches what actually spawned (substitute real critic name into the overlay)
-   - Verify Beat 3/4 veto callouts match real veto weeks from sim manifest
-   - Verify all on-screen agent spec names match the registered agent names (no typos vs `agents/*.json`)
-   - Watch end-to-end at least once on a phone (most judges watch on phones)
-
-7. **Submit**: Cerebral Valley form. Then GitHub repo link. Then DM if relevant.
-
-If anything ambiguous, surface `[STUCK]` to Richie — don't improvise.
-
----
-
-## Beat 1 — Nicolette clip (locked draft)
-
-**Role**: Emotional hook. Real user describing real pain. Not a product endorsement.
-
-**Talking points** (pick 3-4 for final):
-
-1. **The weekly reality** — "Every week I'm on the clinic floor. I treat patients, I run the business, I can't also sit at my laptop A/B testing hero copy."
-   - _Lands because_: time-scarcity is universal SMB pain; "clinic floor" is concrete.
-
-2. **Manual A/B mechanics** — "I've changed headlines before. You change one line and you don't know for a month whether it helped. By then you forgot what you changed."
-   - _Lands because_: concrete mechanics of why solo A/B is broken — timescale × memory = impossible feedback loop.
-
-3. **Trust-sensitive business** — "My patients need to trust me before they ever come in. My site has to earn that. Not once — every time."
-   - _Lands because_: LP isn't marketing fluff; it's patient acquisition in a trust profession.
-
-4. **Time cost** — "I'd need to pay someone 10-20 hours a month to do what Webster does in a weekly cycle."
-   - _Lands because_: concrete dollar/hour framing judges hear without Richie narrating.
-
-5. **Transformative outcome** — "I just want to walk in Monday and know the page is better than last Monday. Without me doing anything."
-   - _Lands because_: articulates Webster's outcome in her own words.
-
-6. **AI credibility pivot** — "I've tried AI tools before. They gave me generic copy. This is the first one that sounds like me."
-   - _Lands because_: brand-voice preservation differentiates Webster from LLM-slop.
-
-**Production notes**:
-
-- Natural lighting (clinic or home office background)
-- Medium-close framing, eye level
-- External mic (lavaliere or shotgun) — laptop mic kills credibility
-- Each point: 20-45 seconds raw. 3-5 takes per point.
-- No teleprompter. She speaks from the heart.
-
-**Anti-goals**:
-
-- NO reading of scripted lines
-- NO Webster endorsement phrases
-- NO naming "Webster" or "the council"
-- NO discussing Opus 4.7 or Anthropic (voiceover's job)
-- NO A/B jargon (bounce rate, funnel)
-
-**Final cut target**: 45s (target) / 35s (floor) — pick 3 talking points for target, drop to 2 for floor
-
-**First-cut recommended**: #1 (clinic floor) + #2 (manual A/B mechanics) + #5 (Monday outcome). #1 anchors the time-pain, #2 makes it concrete, #5 articulates the exact Webster outcome in her own words.
-
-**Drop priority (first to drop → last to drop) if cut runs long**:
-
-1. #4 (time cost dollar framing) — voiceover can deliver this more efficiently
-2. #6 (AI credibility pivot) — overlaps with brand-voice reveal in Beat 2
-3. #3 (trust-sensitive business) — important but adjacent, not core A/B pain
-4. #2 (manual A/B mechanics) — concrete but partially redundant with #1
-5. #1 (clinic floor) — anchor opener, hard cut
-6. #5 (Monday outcome) — must-keep, defines outcome
-
-If only 2 fit (floor cut), keep #1 + #5.
-
-### Beat 1 — Interview guide for Nicolette meeting
-
-Goal: elicit the 6 talking points in her own words. Open questions first; follow-ups only if she doesn't hit the angle naturally. **Do NOT ask her to praise Webster, name the council, or read lines.**
-
-**Opening framing** (say to her before recording starts):
-
-> "I'm not going to put words in your mouth or feed you lines. I just want to record you describing your week and what's hard, in your own words. Talk like you're explaining it to a friend, not pitching anything. We'll do multiple takes — feel free to retry any answer."
-
-**Interview questions** (in order, each elicits a talking point):
-
-| #   | Question to ask on camera                                                                                                      | Eliciting (talking point)                        | Follow-up if she doesn't hit it                                                        |
-| --- | ------------------------------------------------------------------------------------------------------------------------------ | ------------------------------------------------ | -------------------------------------------------------------------------------------- |
-| 1   | "Walk me through what your average week looks like."                                                                           | #1 — weekly reality, clinic floor, time scarcity | "When in your week do you ever sit at your laptop and optimize the website?"           |
-| 2   | "Have you ever tried to change something on the website to get more bookings? What happened?"                                  | #2 — manual A/B mechanics, broken feedback loop  | "How long did it take to know whether the change worked?"                              |
-| 3   | "What role does your website play in your relationship with patients?"                                                         | #3 — trust-sensitive business                    | "How does the page need to make a brand-new patient feel before they ever walk in?"    |
-| 4   | "If you wanted to keep improving the website every week — manually — what would that cost you?"                                | #4 — time cost, hire-someone framing             | "Would you actually hire someone to do that, or just live without it?"                 |
-| 5   | "If a tool could quietly improve your website each week without you doing anything, what would the perfect outcome feel like?" | #5 — Monday outcome, transformative              | "What would you want to see when you check it next week vs this week?"                 |
-| 6   | "Have you tried any AI tools for your business before? What was that experience like?"                                         | #6 — AI credibility pivot, generic copy          | "Did any of them ever feel like they actually understood your business or your voice?" |
-
-**Soft warm-up question** (use if she's stiff at start, no need to use the take in final cut):
-
-> "Tell me a bit about yourself and Richer Health — what you do, who your patients are."
-
-**Anti-goals during the interview** (avoid these mistakes):
-
-- Don't ask her to praise Webster, the council, or any product. Anything she says about a product becomes salesy.
-- Don't say "rate Webster on a scale of..." — she's not reviewing software.
-- Don't lead with claims ("Webster cut your bounce rate by X%") — she'll repeat the number and it's a fabrication.
-- Don't ask yes/no questions — they produce dead air. Open questions only.
-- Don't interrupt her for retakes mid-answer. Let her finish, then ask "wanna try that one again?"
-- Don't worry about background noise / lighting too much — patient-clinic look is authentic. Just no distracting background motion.
-
-**Production reminders** (you already know but for the record):
-
-- External mic on her (lavaliere or shotgun). Phone mic kills credibility.
-- Eye-level framing, medium-close (shoulders up).
-- Multi-take per question — get 3-5 takes per angle so you have options at edit time.
-- Total recording target: ~30-45 min for all 6 angles + warm-up.
-- Final cut from this footage: 45s (Beat 1) + 3s echo (Beat 6 bookend, ideally pulled from talking point #5).
-
-**Edit-time selection rule**: in the final cut, prefer takes where she sounds _resigned_ over takes where she sounds _frustrated_. The Beat 1 emotional register is "this is just my reality" not "this is unfair." Resignation registers as relatable; frustration registers as venting.
-
-## VO recording script (Richie reads top to bottom)
-
-Total spoken material: ~65 seconds across 5 narrated beats. Recording session length: aim for 30-45 min including retakes.
-
-**Tone reminders (before you start)**:
-
-- Conversational, not declamatory. Talk like you're explaining to a curious friend.
-- ~130 wpm — slower than your normal speech; let lines breathe.
-- 3-5 takes minimum per line. Read straight first, then vary emphasis.
-- Pauses between sentences are fine — they get cut at edit.
-- For punchlines ("Like growing a new sense" / "Real. Not pre-scripted." / the tagline) — slow down, lean in.
-
----
-
-### Beat 2 — Solution intro (~24s spoken)
-
-Record as 4 separate takes. Pause 2-3s between takes for the editor.
-
-**Take 1**:
-
-> "I taught a website to improve itself."
-
-**Take 2**:
-
-> "Every week, a council of Claude agents debates it — copy, conversion, brand voice, SEO, compliance. They propose, apply, verify."
-
-**Take 3**:
-
-> "And when they hit a blind spot they can't solve — they write a new agent. With code. From scratch."
-
-**Take 4** (slow down, this is the Beat 2 punch + Beat 5 setup):
-
-> "Like growing a new sense."
-
----
-
-### Beat 3 — LP timelapse VO (~9s spoken total)
-
-3 sparse callouts. Each is a single line, recorded standalone.
-
-**Take 1** (week 1 callout — slight resignation in tone, this is the "before"):
-
-> "Week one — ugly, generic, no brand."
-
-**Take 2** (veto callout — flat, factual, slightly amused at the system):
-
-> "Week six — the council rejected this redesign."
-
-**Take 3** (week 10 callout — confident, payoff energy):
-
-> "Week ten — on brand, converting."
-
----
-
-### Beat 4 — Site timelapse VO (~9s spoken total)
-
-3 sparse callouts.
-
-**Take 1** (opening, the highest-leverage 4 words in Beat 4):
-
-> "Different industry. Same system."
-
-**Take 2** (veto, parallel to Beat 3):
-
-> "Council rejected this redesign."
-
-**Take 3** (week 10):
-
-> "Trust signals. Clear pricing. Mobile-ready."
-
----
-
-### Beat 5 — Genealogy reveal (~19s spoken)
-
-3 narration segments + a spawn-moment pause.
-
-**Take 1** (setup, descriptive):
-
-> "Twelve memory stores fill over the weeks. Each council inherits what came before."
-
-**Take 2** (problem reveal + spawn — the dramatic line):
-
-> "And in week eight — they hit a problem nothing could solve. So they wrote a new agent."
-> ⚠️ **Placeholder check**: if actual spawn happened on a different week (not week 8), record alternates: "...week seven...", "...week nine...", etc. Get whatever range covers the likely actual spawn week.
-
-**Take 3** (post-spawn, confident, factual):
-
-> "A new sense. Real. Not pre-scripted."
-
----
-
-### Beat 6 — Close (~4s spoken)
-
-**Take 1** (bookend energy, slight smile in voice):
-
-> "A website that improves itself. Built with Opus 4.7."
-
----
-
-### Recording order recommendation
-
-Record in this order to warm up your voice:
-
-1. Beat 3 callouts (3 short lines — easy warm-up, low stakes)
-2. Beat 4 callouts (3 short lines — same energy as Beat 3)
-3. Beat 6 tagline (single short line — closer)
-4. Beat 5 narration (3 takes — mid-stakes, building)
-5. Beat 2 narration (4 takes — highest stakes, do these last when you're warmest)
-
-Save your best vocal energy for Beat 2 since it sets the tone for the whole video.
-
-### Anti-goals
-
-- Don't try to "sound like a podcast voiceover." That's the AI-slop voice. Sound like you.
-- Don't rush Beat 2 punchlines. "From scratch." and "Like growing a new sense." need air around them.
-- Don't add words. Read the locked script verbatim. Tone variation only.
-- Don't try to do all 65s in one continuous take. Per-line takes give the editor room.
-
----
-
-## Tooling stack — composition pipeline
-
-| Tool                                                             | Use                                                                                                                          | Notes                                                                                                                                                                                                                                                                                                                           |
-| ---------------------------------------------------------------- | ---------------------------------------------------------------------------------------------------------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| **Claude Design** (claude.ai/design, research preview, Opus 4.7) | Animated council diagram, real-artifact UI windows (critic finding cards, API req/res viewer), any HTML/CSS/JS-driven motion | Code-powered output (HTML/CSS/JS, WebGL, shaders). Two-pane chat + canvas. Exports as ZIP / standalone HTML / handoff bundle to Claude Code. NOT for photorealistic AI video. Token cost: animations are heavier than static — budget accordingly. Known bug: inline comments occasionally drop, paste into chat as workaround. |
-| **Forge Remotion**                                               | Final video composition: stitching voiceover + Nicolette clip + Claude Design HTML + sim screenshots + transitions + music   | React-based programmatic video composition. Embeds Claude Design output via `<Html>` / `<IFrame>` or screen-recorded MP4.                                                                                                                                                                                                       |
-| **Sim screenshot harness** (T9 deliverable)                      | Per-week per-breakpoint screenshots of both substrates, used as raw frames for timelapse beats                               | Output lives in `demo-output/<substrate>/week-N/screenshots/{375,768,1440}/*.png`                                                                                                                                                                                                                                               |
-| **Anthropic Console**                                            | Source for memory store screenshots (Beat 5), agent registration screenshots (Beat 2 fallback)                               | Manual capture; relative captions per VISION.md (Week 1 / Week 5 / Week 10)                                                                                                                                                                                                                                                     |
-| **Recording surface (Richie)**                                   | Voiceover, Nicolette clip, onboarding role-play                                                                              | External mic. Recorded separately.                                                                                                                                                                                                                                                                                              |
-
-## Asset handoff to composition session
-
-When the video-composition session starts (after T10), it inherits:
-
-1. This file (VIDEO-PLAN.md) — complete shot list, timing, drop priorities
-2. `demo-output/lp/` — Richer Health screenshots, manifests, council reasoning per week
-3. `demo-output/site/` — Northwest Reno screenshots, manifests, council reasoning per week
-4. Real artifact bodies (captured from sim runs):
-   - Best critic finding text (for Beat 2 Window 1) — sourced from `demo-output/lp/week-N/findings/`
-   - Real `POST /v1/agents` request + response (for Beat 2 Window 2) — captured during genealogy spawn
-5. Memory Stores Console screenshots (Beat 5) — Richie captures during/after sim runs
-6. Voiceover script (drafted in this file as we grill) + recorded audio
-7. Nicolette clip (Richie sources)
-
-Composition session then opens Claude Design to build animated assets, screen-records or exports them, and composes everything in Remotion.
-
-## Per-beat specifications (all locked)
-
-### Beat 2 — Solution intro — LOCKED
-
-**Locked**:
-
-- Length: 35s target / 25s floor
-- Voice: Richie's real voice (Q2.1 = A) — applies to all narrated beats in the video
-- Narrative structure: tease genealogy upfront (Q2.2 = D) — sets up Beat 5 payoff
-- Visual treatment: animated structural diagram + 2 real artifact "windows" (Q2.3 = B)
-  - Diagram: site at center, 5 critic nodes orbiting, redesigner + verifier on side, NEW node spawns at "author a new agent" moment
-  - Window 1 (during "council debates", ~3s): real critic finding text in styled card UI (built in Claude Design)
-  - Window 2 (during "author a new agent", ~3s): real `POST /v1/agents` request + 200 response in HTTP-inspector UI (built in Claude Design)
-- Real artifact bodies (not mocked): captured from actual sim runs; Claude Design wraps them in branded UI
-
-**Production workflow**:
-
-1. Claude Design generates the council diagram as animated HTML/CSS/JS (loops, scroll-triggered, or play-on-trigger)
-2. Claude Design generates the two artifact windows with real captured bodies as styled HTML
-3. Screen-record Claude Design output (or export ZIP and play HTML in Remotion via `<Html>` / `<IFrame>`)
-4. Remotion composes the recordings with voiceover, transitions to Beat 3
-
-**Locked fine-tuning** (Q2.4):
-
-- Critic node labels: real spec names + role subtitle (e.g. `conversion-critic` / "Conversion") — A3
-- Narration framing: "council of Claude agents" — B1
-- Diagram critic set: LP-sim (`seo-critic`, `brand-voice-critic`, `fh-compliance-critic`, `conversion-critic`, `copy-critic`) — primary set established in Beat 2, since Beat 3 plays the LP timelapse next
-
-**Artifact capture criteria** (decided in advance, content captured during sim):
-
-- Window 1 source: best critic finding from `demo-output/lp/week-N/findings/` — selection criteria: specific (not generic), short (fits a card), demonstrates real judgment (not boilerplate)
-- Window 2 source: actual `POST /v1/agents` request body + 200 response captured at the genealogy spawn moment during sim. If pure-organic spawn doesn't fire by Week 10, use the 1-day diagnose budget per VISION.md, then re-run; absolute fallback is to capture from a manually-prompted spawn during diagnostics (Beat 5 documents this risk)
-
-**Locked narration script (Q2.5 = Draft A)**:
-
-> "I taught a website to improve itself.
->
-> Every week, a council of Claude agents debates it — copy, conversion, brand voice, SEO, compliance. They propose, apply, verify.
->
-> [breath — Window 1: real critic finding card, ~3s]
->
-> And when they hit a blind spot they can't solve — they write a new agent. With code. From scratch.
->
-> [breath — Window 2: real POST /v1/agents call + response, ~3s]
->
-> Like growing a new sense."
-
-53 words → ~24s narration + 6s artifact dwell + 4s transition = ~34s.
-
-**Locked visual choreography**:
-
-| Time   | Narration                                                                                             | Visual                                                                             |
-| ------ | ----------------------------------------------------------------------------------------------------- | ---------------------------------------------------------------------------------- |
-| 0-3s   | "I taught a website to improve itself."                                                               | Diagram opens: ugly site materializes at center                                    |
-| 3-10s  | "Every week, a council of Claude agents debates it — copy, conversion, brand voice, SEO, compliance." | 5 critic nodes appear in sequence as named, each with `xxx-critic` + role subtitle |
-| 10-13s | "They propose, apply, verify."                                                                        | Redesigner + verifier nodes light up                                               |
-| 13-16s | [breath]                                                                                              | Window 1 pops in: real critic finding card (~3s)                                   |
-| 16-21s | "And when they hit a blind spot they can't solve — they write a new agent."                           | Diagram shows "?" gap node, new node materializes                                  |
-| 21-24s | [breath]                                                                                              | Window 2 takes over: real POST /v1/agents call + response (~3s)                    |
-| 24-27s | "With code. From scratch."                                                                            | Back to diagram, new node integrated                                               |
-| 27-31s | "Like growing a new sense."                                                                           | Diagram pulses, holds                                                              |
-| 31-35s | [transition]                                                                                          | Fade to Beat 3 opener                                                              |
-
-**Open / not blocking**:
-
-- Music / SFX bed (or silent under VO) — composition session decides at compose time
-
-**Drop priority (35s → 25s floor)**:
-
-1. Drop Window 1 (real critic finding UI) — diagram still conveys "critics critique"; window is proof but not load-bearing
-2. Compress diagram opening animation — start with diagram already populated instead of nodes appearing one-by-one
-3. Cut narration beat #2 ("a council of Claude agents debates it weekly") — implied by diagram
-4. Floor structure: open with already-populated diagram → narration beats #1, #3, #4 → spawn moment with Window 2 → transition. Loses pacing breath but keeps the tease intact.
-
-### Beat 3 — LP timelapse (Richer Health) — LOCKED
-
-**Locked**:
-
-- Length: 35s target / 25s floor
-- Pacing principle: **dwell on key moments** (Q3.1 = C). Fast cuts (~2s) for incremental weeks, longer dwell (~5s) on weeks with major visual deltas + the veto + bookends (week 1, week 10). Specific dwell times assigned at composition time from actual sim screenshots.
-- Veto treatment: **halt callout** (Q3.2 = A). At the veto week, overlay "Week N — REJECTED" briefly stops timelapse, shows proposed-vs-rejected comparison (~3s), then resumes.
-
-**Key-moment heuristic for composition session** (use this to assign dwell times when you have the screenshots):
-
-1. **Week 1 (baseline)**: ~5s dwell — viewer needs to register the ugly starting state
-2. **First major redesign week** (largest visual delta vs week 1, likely w2-w4): ~5s dwell
-3. **Veto week** (per sim manifest, planted w5-w6): ~5s halt with REJECTED overlay
-4. **Mid-progression weeks** (incremental changes, no major restructure): ~2s flips
-5. **Week 10 (final reveal)**: ~5s dwell — payoff
-6. **Genealogy spawn week** (if visible in screenshots, e.g. w7-w8): ~4s dwell — sets up Beat 5
-
-How to identify the "first major redesign": diff weeks pixel-by-pixel (or just eyeball them) and find the first week where >40% of viewport pixels changed vs the prior week. That's the redesign moment.
-
-**Drop priority for floor (35s → 25s)**:
-
-1. Reduce mid-progression flip from 2s → 1.5s (saves ~3s across 5 mid weeks)
-2. Drop the genealogy-spawn-week dwell — let Beat 5 carry that
-3. Trim veto halt from 5s → 3s (still visible, less narrative weight)
-4. Trim week 10 dwell from 5s → 3s
-5. Floor structure: ~3s baseline + ~3s first redesign + ~3s veto + ~9s incremental + ~3s w10 + ~4s overlay/transitions = ~25s
-
-**Locked visual layers (Q3.3 + Q3.4)**:
-
-- Breakpoint treatment: **desktop (1440) for the 10-week timelapse** + 2-3s **breakpoint sweep on the final week-10 frame** (morphs through 1440 → 768 → 375 to prove responsive). Q3.3 = E.
-- Analytics overlay: **animated line chart, bounce-rate trending down across weeks** in top-right corner, drawn live in sync with timelapse pacing. Q3.4 = B.
-  - **Built in Claude Design** as animated HTML/CSS chart. Data source: real synthetic-analytics output from `demo-output/lp/week-N/analytics.json` (T5 deliverable). Chart scrubs data points week-by-week as the timelapse plays; final value highlighted at week 10.
-
-**Locked text + audio (Q3.5 + Q3.6)**:
-
-- Week labels: **"Week N" bottom-left, simple** (Q3.5 = A). Big enough to read; sim dates are seeded so absolute date adds no signal.
-- Narration: **sparse VO at 3 key moments + music bed underneath** (Q3.6 = B). Roughly:
-  - Week 1 (~3s): "Week one — ugly, generic, no brand."
-  - Week 6 / veto halt (~3s): "Week six — the council rejected this redesign."
-  - Week 10 (~3s): "Week ten — on brand, converting."
-- Cursor/pointer overlay: skip (adds noise without payoff)
-
-### Beat 3 status: LOCKED
-
-### Beat 4 — Site timelapse (Northwest Home Renovations) — LOCKED
-
-**Locked**:
-
-- Length: 30s target / 22s floor
-- Pacing principle: dwell-on-key-moments (parallel to Beat 3, same heuristic)
-- Veto treatment: halt callout (parallel to Beat 3)
-- Analytics overlay: animated bounce-rate line chart in corner (parallel to Beat 3, fed by `demo-output/site/week-N/analytics.json`)
-- Week labels: "Week N" bottom-left
-- Critic set established for diagram (if Beat 4 ever flashes diagram): `seo-critic`, `brand-voice-critic`, `licensing-and-warranty-critic`, `conversion-critic`, `copy-critic` (note: licensing-and-warranty replaces fh-compliance for the contractor substrate)
-- Page handling (Q4.1 = E): **home page primary timelapse for ~27s + ~3s "page sweep" at week 10** (week 10 home holds, then morphs through the services + free-estimate pages, which have also evolved)
-- Narration framing (Q4.2 = B): mirror Beat 3 + lead with generalization beat
-  - 0-3s: "Different industry. Same system."
-  - ~Week 6 veto halt (~3s): "Council rejected this redesign."
-  - ~Week 10 (~3s): "Trust signals. Clear pricing. Mobile-ready."
-
-Total: ~9s VO + ~21s silent-with-music + visuals = 30s
-
-**Why "Different industry. Same system." is load-bearing**: this 4-word opening converts Beat 4 from "redundant second timelapse" into "generalization proof." Without it, judges see two timelapses; with it, they see Webster's judgment generalizing across substrates. Highest-leverage line of Beat 4.
-
-**Drop priority for floor (30s → 22s)**:
-
-1. Drop the page sweep at week 10 (saves ~3s) — loses "full site" proof, falls back to "home page only" framing
-2. Reduce mid-progression flips ~2s → ~1.5s (saves ~3s)
-3. Trim veto halt from 5s → 3s (saves ~2s)
-4. Floor structure: ~3s baseline + ~3s first redesign + ~3s veto + ~7s incremental + ~3s w10 + ~3s overlay/transitions = ~22s. Loses page sweep; keeps generalization framing.
-
-### Beat 4 status: LOCKED
-
-### Beat 5 — Genealogy reveal — LOCKED
-
-**Locked**:
-
-- Length: 25s target / 18s floor
-- Visual structure (Q5.1 = D): **composite Claude Design treatment** — animated genealogy tree rendered _inside_ a stylized Console UI frame; Week N captions on the side; the 13th critic both grows on the tree AND appears in the Console list simultaneously. One animation conveys metaphor + proof.
-- Spawn dramatization (Q5.2 = D): **pause + zoom + audio stinger + critic-name overlay**. At spawn moment: animation freezes ~1s, camera zooms onto new entry/branch, audio stinger fires, text overlay shows the actual spawned critic's name (e.g. `mobile-ux-critic — week 8`) for ~1s.
-- Narration script (Q5.3 = Draft C):
-
-  > "Twelve memory stores fill over the weeks. Each council inherits what came before.
-  >
-  > And in week eight — they hit a problem nothing could solve. So they wrote a new agent.
-  >
-  > [SPAWN — pause + zoom + stinger + critic-name overlay]
-  >
-  > A new sense. Real. Not pre-scripted."
-
-  ~42 words → ~19s narration + 6s spawn dwell.
-
-**Visual choreography**:
-
-| Time   | Narration                                                                           | Visual                                                                                           |
-| ------ | ----------------------------------------------------------------------------------- | ------------------------------------------------------------------------------------------------ |
-| 0-5s   | "Twelve memory stores fill over the weeks. Each council inherits what came before." | Composite Console-styled UI; store list grows Week 1 → 5 → 10; tree visible on side at 9 critics |
-| 5-9s   | [breath beat, music carries]                                                        | Tree pulses; council animation shows 9 critics active                                            |
-| 9-13s  | "And in week eight — they hit a problem nothing could solve."                       | "?" gap node appears in tree; critics visibly stuck                                              |
-| 13-15s | "So they wrote a new agent."                                                        | New branch begins growing                                                                        |
-| 15-19s | [SPAWN — pause + zoom + stinger + overlay]                                          | Pause; zoom on new branch + new Console entry; "<critic-name> — week 8" overlay for ~1s          |
-| 19-22s | "A new sense. Real. Not pre-scripted."                                              | Both Console + tree visible, holds                                                               |
-| 22-25s | [transition]                                                                        | Fade to Beat 6                                                                                   |
-
-**Critical fallback handling — pure-organic genealogy may not fire**:
-
-VISION.md is explicit that the spawn is pure-organic, no pre-committed target. If genealogy doesn't fire by week 10:
-
-1. **First fallback** (per VISION.md, 1-day diagnose budget): investigate why detection didn't trigger → adjust thresholds/prompts → re-run sim. Spawn happens, Beat 5 plays as designed.
-2. **Second fallback** (if re-run still doesn't spawn): Beat 5 gets RESTRUCTURED. Options:
-   - 2a. Cut Beat 5 entirely. Redistribute ~25s across Beat 3/4 timelapses (extra dwell). Genealogy concept stays as Beat 2 tease but is unfulfilled. Video runs ~2:35. **Risk**: pitch loses its sharpest claim.
-   - 2b. Keep Beat 5 but reframe as "memory stores fill over time" — drop the spawn moment. Narration: "Twelve memory stores fill over the weeks. Each council inherits what came before. The council learns." No spawn callout. **Risk**: violates Beat 2 promise of "growing a new sense."
-   - 2c. Honest framing — Beat 5 narrates "we ran ten weeks; no spawn fired this time." Authentic but undermines pitch. **Risk**: kills momentum.
-3. **Absolute fallback** (per VISION.md): video restructures around improvement story alone. Beat 2 tease gets re-cut to remove "growing a new sense" line.
-
-**Decision rule for the composition session**: if at simulation completion the spawn didn't fire AND re-run also didn't fire, surface this as a `[STUCK]` to Richie before proceeding. Do not silently fall back to 2b or 2c.
-
-**Placeholder substitution (composition session must do)**:
-
-The Beat 5 narration script and visual choreography contain placeholders that get filled from the actual sim run:
-
-- `week eight` in narration → substitute actual spawn week (could be w5, w7, w9, etc.)
-- `<critic-name> — week 8` in overlay → substitute actual spawned critic name + actual week
-- "Twelve memory stores" → confirm count is still 12; if genealogy spawned a critic that got its own memory store, the count is now 13 — adjust narration accordingly
-- Which substrate spawned (LP or site)? — narration is substrate-agnostic in current draft. If visually obvious, optionally add "during the {trade contractor / clinic} run" — but this might break pacing. Default: keep substrate-agnostic.
-
-**Drop priority for floor (25s → 18s)**:
-
-1. Drop the 4s breath beat (5-9s) — keeps narration tight
-2. Trim spawn dwell from 6s → 4s
-3. Trim final hold from 3s → 2s
-4. Floor structure: ~5s setup + ~4s problem reveal + ~2s spawn line + ~4s spawn dwell + ~3s resolution = ~18s
-
-### Beat 5 status: LOCKED with fallback rules
-
-### Beat 6 — Close — LOCKED
-
-**Locked**:
-
-- Length: 10s target / 8s floor
-- Closing structure (Q6.1 = A): **Nicolette bookend + tagline + GitHub URL** — emotional symmetry, opens and closes on her
-- Tagline (Q6.2 = A): **"A website that improves itself. Built with Opus 4.7."**
-  - Closes the linguistic loop: Beat 2 says "I taught a website to improve itself" (first-person, builder); Beat 6 says "A website that improves itself" (third-person, system) → implies Webster has internalized the capability
-  - "Built with Opus 4.7" is the literal hackathon submission framing
-- Logo/URL frame (Q6.3 = E): **Webster wordmark + "Built with Opus 4.7" lockup + GitHub URL + small QR code** — single composition, full hackathon framing, scannable for viewers outside Cerebral Valley submission form
-- Anthropic feature grid: NOT in the video. Lives as a standalone HTML page linked from README (Tier 1 extra-time move). Beat 6 stays clean.
-
-**Visual choreography**:
-
-| Time  | Narration / Visual                                                                                                              | Asset                     |
-| ----- | ------------------------------------------------------------------------------------------------------------------------------- | ------------------------- |
-| 0-3s  | Brief flash of Nicolette echoing "...without me doing anything." (cut from Beat 1 take)                                         | Nicolette video clip echo |
-| 3-7s  | VO: "A website that improves itself. Built with Opus 4.7." Tagline appears on screen as it's spoken                             | On-screen tagline text    |
-| 7-10s | Tagline holds → fades into final frame: Webster wordmark + "Built with Opus 4.7" lockup + GitHub URL + small QR → fade to black | Logo lockup composition   |
-
-**Production note**: The 3s Nicolette echo is ZERO additional cost — capture this as a separate take during her main session (or cut from her existing footage). Frame: the same "Monday outcome" line from Beat 1, but used as the closing affirmation here.
-
-**Drop priority for floor (10s → 8s)**:
-
-1. Compress Nicolette echo from 3s → 1.5s (saves ~1.5s) — keeps the bookend, tighter cut
-2. Compress tagline reveal from 4s → 3s (saves ~1s)
-3. Floor structure: 1.5s Nicolette echo + 3s tagline + 3.5s logo+URL+fade = 8s
-4. Absolute fallback (if even 8s is over): drop Nicolette echo entirely → 4s tagline + 4s logo+URL = 8s. Loses bookend; gains cleanest close.
-
-### Beat 6 status: LOCKED
-
-## Video length — LOCKED at 3:00
-
-Hard ceiling: **180 seconds**. We design to a tighter floor budget so composition can absorb overshoot without breaking the arc.
-
-### Per-beat budgets (target / floor)
-
-| Beat                 | Target          | Floor           | Notes                                             |
-| -------------------- | --------------- | --------------- | ------------------------------------------------- |
-| 1 — Nicolette        | 45s             | 35s             | Pick 3 talking points; floor = drop one           |
-| 2 — Solution intro   | 35s             | 25s             | Floor = compress narration, single animation pass |
-| 3 — LP timelapse     | 35s             | 25s             | Floor = single breakpoint, no analytics overlay   |
-| 4 — Site timelapse   | 30s             | 22s             | Floor = compress 3-page rotation                  |
-| 5 — Genealogy reveal | 25s             | 18s             | Floor = static screenshots only, no zoom-in       |
-| 6 — Close            | 10s             | 8s              | Floor = drop CTA framing, just tagline            |
-| **Total**            | **180s (3:00)** | **133s (2:13)** | 47s buffer for composition                        |
-
-### Safeguard mechanism — drop-priority list per beat
-
-Each beat above has a **numbered drop list**. If composition session sees the cut running over 3:00, walk the list mechanically: drop item #1, recheck length, still over? Drop #2. No judgment calls under deadline pressure.
-
-All drop lists populated. Composition session can execute mechanically.
-
-**Open caveat**: confirm Cerebral Valley submission guidelines don't impose a stricter cap (e.g., 2:00). If they do, collapse to floors (target = 2:13). If they require under 2:13, escalate to Richie — partial cut required.
-
-## File pointers (read on rehydration)
-
-- `context/VISION.md` — canonical north-star
-- `context/EXPANSION-TASKS.md` — T0–T10 implementation scaffolding
-- `context/FEATURES.md` — shipped feature log
-- `AGENTS.md` — operator guide
-- `agents/AGENTS.md` — agent spec rules
-- `~/Vault/Projects/webster/webster-decision-log.md` — ADR log
-
-## Identity facts (never drift)
-
-- **Nicolette**: real client of Richer Health. Live site `certified.richerhealth.ca` — NEVER use in sim. Production `webster-*` agents run her real weekly council.
-- **Northwest Home Renovations**: fictional contractor. Pacific Northwest. Blue-collar trade angle (demographic least served by AI).
-- **Richie**: sole builder/operator. ADHD, autodidact, systems-thinker. Thinks in layers and building blocks.
-
-## Resume protocol (post-compaction)
-
-All 6 beats are LOCKED. Grilling complete.
-
-If a fresh session opens with this file:
-
-1. Read this file in full (VIDEO-PLAN.md)
-2. Read VISION.md demo arc section
-3. Confirm what's needed: composition session execution OR additional grill rounds OR something else
-4. If executing composition: see "Composition session brief" section above. If anything ambiguous, surface `[STUCK]` to Richie — do not improvise the spec.
-
-## Locked decisions (do not re-grill)
-
-From prior grilling + VISION.md:
-
-- Two substrates only (Richer Health LP + Northwest Home Renovations)
-- 10 weeks per substrate
-- Pure-organic genealogy (no pre-committed spawn target)
-- 1 veto per substrate embedded at week 5-6 for authenticity
-- Video composed in fresh session via Forge Remotion after assets exist
-- Hybrid memory (file-based ground truth + 12 managed stores for showcase)
-- MCP-native sim agents (no WebFetch, no localhost, no deploy)
-- Demo arc is 6 beats per VISION.md
-- Nicolette clip anti-goals (no scripting, no product naming, no A/B jargon)
-- Memory Stores demo uses **relative captions** (Week 1/5/10), not timestamps
-
-## Deferred (not part of this session's grilling)
-
-- Nicolette video clip recording (Richie does in separate session)
-- Voiceover narration recording (after script drafted)
-- Onboarding skill role-play recording (separate video asset)
-- Cerebral Valley submission form (manual at submission time)
-- Tier 1 extra-time moves (Webster-for-Webster, feature grid, playground, governance narrative, cost transparency) — queued after T10
-
-## Post-T10 followups (technical debt / enhancements surfaced during planning)
-
-**Mobile responsiveness gap in redesigner specs** (severity: medium, effort: ~20 min):
-
-- `webster-redesigner.json` system prompt has zero mobile/responsive/breakpoint directives. It proposes LP changes without reasoning about mobile upfront.
-- Visual reviewers DO catch breakpoint regressions reactively (production + both sim variants check 375/768/1440), but reactive ≠ proactive.
-- Sim redesigners (`webster-lp-sim-redesigner`, `webster-site-sim-redesigner`) have the same gap.
-- Fix path:
-  1. Extend redesigner system prompts: "Specify changes for all 3 breakpoints (375/768/1440). Note responsive behavior explicitly in proposal.md."
-  2. Either extend `visual-design-critic` to judge mobile upfront OR add a dedicated `mobile-ux-critic` to the council
-- Risk if not fixed: wasted iteration cycles (redesigner proposes desktop-first → visual reviewer blocks → redesigner re-proposes); mobile-specific _opportunities_ missed (only regressions get caught, not absent improvements).
-- Does NOT block hackathon submission — visual reviewers safety-net mobile during sim runs. This is a quality enhancement.
diff --git a/context/v2-design.md b/context/v2-design.md
deleted file mode 100644
index 6b8d46e..0000000
--- a/context/v2-design.md
+++ /dev/null
@@ -1,312 +0,0 @@
-# Webster v2 — Apply + Review/Fix Loop (design doc)
-
-> Captured during session 4 Phase 2 grill-me on 2026-04-23.
-> Feature entries: `FEATURES.md` #39 (apply worker), #40 (image-gen).
->
-> Context: Richie executed session 4 in auto-mode. Below reflects the
-> best-available decisions derived from the prompt's rec baseline + the
-> live finding from today's wget mirror (critic blind-spot re
-> `data-calendly-base` runtime rewrite) + advisor sanity-check.
-> Items marked **[R-confirm]** would benefit from an explicit Richie pass
-> before implementation kicks off.
-
----
-
-## Q1 — Apply worker runtime
-
-**Decision (80/100):** Pi worker (Codex gpt-5.4) invoked via a Forge
-workflow, worktree-isolated per apply run.
-
-**Rationale (building blocks → connections → behaviour):**
-
-- Pi is already Webster's worker-pool standard. Adding another runtime
-  class for one new worker is cost the system doesn't need.
-- Codex (gpt-5.4, high reasoning) handles structured code mutation
-  reliably — find-string / replace-with-tree transforms, JSON-LD
-  insertion, Astro-component patching. Today's session proved this kind
-  of work is doable by a reasoning model, not a stretch.
-- Forge gives the two things the apply step needs that raw `claude -p`
-  doesn't: (a) isolated git worktree per run, so one bad apply doesn't
-  clobber another's branch; (b) a validation stage with lint+type+format
-  baked in.
-- The alternative of a Claude Opus managed-agent session is overkill —
-  Opus' reasoning surplus isn't the bottleneck in find-replace on 5
-  issues; the bottleneck is confining the transform. Codex + validation
-  harness wins on $/task by an order of magnitude.
-
-**Non-options:** a Claude Opus managed-agent; a `claude -p` subscription
-without Forge isolation.
-
-**Open:** none significant.
-
----
-
-## Q2 — Done-definition
-
-**Decision (72/100):** Three-part gate, all required to pass before the
-apply worker opens a PR:
-
-1. **Static floor** — lint + type + format green on the mutated source
-   (mirrors existing Webster validate pipeline).
-2. **Runtime check** — headless browser opens the mutated page and
-   verifies CTAs resolve to real booking URLs, `<script>` blocks don't
-   throw, no console errors. Directly motivated by today's critic
-   blind-spot finding: static greps miss runtime-rewritten CTAs like
-   `data-calendly-base` → Calendly. A headless-browser gate would have
-   caught the week-1 CRITICAL misdiagnosis.
-3. **Critic re-run** — spawn the same 5 critics (or 6 with visual-design)
-   against the mutated code. Zero new CRITICAL findings required; HIGH
-   findings permitted up to a threshold (e.g. ≤2).
-
-**Rationale:** "green build" is necessary but not sufficient — it doesn't
-catch wrong content, dead JS, or regressions in the critics' core
-concerns. The runtime check is the cheapest addition that closes the
-biggest known gap. Re-running critics is the self-consistency loop.
-
-**Visual-regression snapshot:** deferred to v2 week 2+. The Playwright
-infra to snapshot and diff-compare is a separate setup; week 1 ships
-without it. **[R-confirm]** if visual-regression is worth building
-immediately for the demo-video cut.
-
-**Open:** HIGH-finding threshold (2? 3?). `[R-confirm]`
-
----
-
-## Q3 — #39 ↔ #40 dependency strength
-
-**Decision (78/100):** Soft dependency. #39 (apply worker) ships first
-with `<!-- asset TBD: <type> -->` HTML-comment stubs where it encounters
-image placeholders. #40 (image-gen tool) ships as a follow-up; the apply
-worker begins calling it when available.
-
-**Enumerated type list for #40:**
-
-```text
-{
-  og_card,               // 1200×630 social-share image (week-1 need)
-  hero_background,       // Full-bleed hero section backdrop
-  testimonial_headshot,  // Circular 400×400 portrait for quote cards
-  icon,                  // 48×48 mono/duotone line-art (step cards)
-  section_illustration   // 800×600 supporting editorial image
-}
-```
-
-Five is a small enough list to keep the schema tight. If the apply
-worker encounters a `TBD` type that isn't in this enum, it emits a stub
-comment flagging the need — this is how the enum grows intentionally
-over subsequent weeks.
-
-**Missing-from-list candidates that were considered and cut for v2 week 1:**
-
-- `diagram_illustration` (for arch diagrams, decision trees) — niche on
-  an LP; add if a future week demands it.
-- `pattern_tile` (for textured backgrounds) — CSS can do this.
-- `animated_gif` / `video_loop` — out of scope; different backend.
-
-**Cost ceiling:** $2/run self-imposed (≈20 generations at gpt-image-1
-rates); forces quality gates and prevents a loop from burning $$$ on
-regenerations.
-
-**Brand-context input format:** JSON blob the apply worker builds from
-`context/business.md` + a palette file the onboarding skill writes:
-
-```json
-{
-  "palette": ["#495A58", "#80A8A7", "#292F2E"],
-  "brand_voice": "calm-authoritative; dark/sage/near-black color mood",
-  "typography": "Inter headline, Source Sans Pro body",
-  "restraint": "no saturated primaries, no cartoon style, no stock-photo feel"
-}
-```
-
-**Asset persistence path:** `site/public/assets/generated/<week>/<type>-<slug>.<ext>`.
-Gitignored cache at `.webster/generated-cache/` to dedupe identical-brief
-regenerations across weeks.
-
-**Stub-when-absent vs. complete-or-fail:** stub wins. Partial progress
-beats blocked-entirely; the week-1 proposal's og-card is a good example —
-the SEO meta-tags ship valuable without the image, and the image is a
-separable follow-up. This session's `site/after/index.html` already
-demonstrates the pattern (HTML comments where og-card.jpg would go).
-
-**Open:** backend choice — OpenAI `gpt-image-1` vs. Stitch MCP vs.
-Replicate. gpt-image-1 is the safest default (proven, widely integrated,
-Anthropic-adjacent-tooling-friendly). `[R-confirm]` backend + cost
-ceiling.
-
----
-
-## Q4 — PR format
-
-**Decision (70/100):** One PR per **issue-cluster**, where a cluster is
-the group of issues that touch overlapping files. Minimum 1 issue per
-PR, maximum 3 issues per PR. Hard ceiling: 3 PRs per weekly run.
-
-**Rationale:**
-
-- One-PR-per-issue was the ergonomic ideal (smaller, partial-mergeable,
-  clearer history) but the tradeoff — 5× CI runs, 5× review windows, 5×
-  merge conflicts when two issues touch the same file — is prohibitive
-  in a weekly cadence with non-technical operators reviewing on phone.
-- One-PR-for-everything gives zero partial-merge-ability; operator must
-  accept all-or-nothing, and that's where good proposals die.
-- Cluster-based is the mid-point: related issues (e.g. Issues 2 + 3 from
-  today's proposal both touch the founder section) ship together, so
-  reviewers see a coherent semantic change; unrelated issues (e.g.
-  Issue 5 head-tag vs. Issue 1 CTA wiring) stay separate.
-
-**Clustering heuristic for the apply worker:**
-
-1. Build a `{issue → touched_files}` map after dry-run parse.
-2. Union-find on shared files; each connected component is a cluster.
-3. If any cluster exceeds 3 issues, split heuristically by severity
-   (CRITICALs first cluster, rest second).
-
-**Noise threshold Richie asked about:** in practice ≤3 PRs/week is
-comfortable; ≥5 PRs/week starts eroding review quality. Hard ceiling of
-3 matches this.
-
-**Open:** PR description format — is there a machine-readable `summary.json`
-alongside markdown? `[R-confirm]`
-
----
-
-## Q5 — Failure fallback when apply can't land an issue
-
-**Decision (75/100):** Skip + annotate, with a severity-tiered response.
-
-**Per-issue handling:**
-
-- **String not found / diff impossible**: skip, log to
-  `history/<week>/apply-log.json` with
-  `{issue, reason: "string_mismatch", evidence}`, continue.
-- **Layout conflict (two issues modify the same region incompatibly)**:
-  apply issue with higher severity first; skip the lower one with
-  reason `layout_conflict`; continue.
-- **Merge impossible after 2 auto-fix attempts in the review/fix loop**:
-  skip, log reason `fix_loop_exceeded`, continue.
-
-**PR-level response (after all issues processed):**
-
-- **All 5 issues applied**: open normal PR.
-- **1–4 issues skipped, at least 1 applied**: open PR with `[partial]`
-  label and a "Skipped issues" section in the PR body listing each
-  skipped issue + reason + next-step suggestion.
-- **0 issues applied (all skipped)**: do NOT open a PR; post a
-  structured report to `history/<week>/apply-failed.md` and notify the
-  operator via GitHub issue.
-- **Any skipped issue is CRITICAL severity**: PR opens as draft (not
-  ready), even if others applied cleanly. Operator decides whether the
-  partial ship is acceptable given the CRITICAL skip.
-
-**Rationale:** partial progress > blocked-entirely; the operator sees
-every skip in the PR body, no silent failures. Fail-fast would block
-other fixes for no reason. Auto-escalate to Opus is expensive and
-negates the autonomy claim.
-
-**Open:** `[R-confirm]` whether draft-on-CRITICAL-skip is the right
-default.
-
----
-
-## Q6 — Preview URL strategy
-
-**Decision (85/100):** Cloudflare Pages PR preview URLs. **Confirmed live
-today** — `curl -sI https://certified.richerhealth.ca/` returns
-Cloudflare `report-to` headers (CF Pages behind CF CDN). Every PR against
-the production repo auto-generates a preview URL like
-`pr-<n>.<project>.pages.dev`; operator reviews on that URL with zero
-infra cost.
-
-**Rationale:**
-
-- Standard pattern — CF Pages does this out of the box when a GitHub repo
-  is connected. No custom subdomain, no staging wrangler, no manual
-  deploy step.
-- Disposable — preview URL dies when PR closes. No long-lived staging to
-  maintain.
-- Zero risk to production — separate origin, separate analytics ID
-  (operator must scrub the Umami `data-website-id` on preview builds —
-  see below).
-- Operator can share the preview URL with stakeholders for a pre-merge
-  eyeball without giving GitHub access.
-
-**Gotchas to handle in #39e (preview URL wiring):**
-
-- **Analytics contamination**: the live LP fires `umami` analytics with
-  `data-website-id="2d335573-..."`. Preview builds should either strip
-  the script OR replace the site-id with a preview-only id. Otherwise
-  preview traffic pollutes the real analytics that the monitor reads.
-  Fix: build-time env flag, `data-preview="1"` gates the script.
-- **Canonical tag**: the after/ index.html now has
-  `<link rel="canonical" href="https://certified.richerhealth.ca/">`.
-  On a preview URL this would still point canonical to prod — fine for
-  SEO (preview pages shouldn't index), but verify preview URLs get
-  `X-Robots-Tag: noindex`.
-- **UTM passthrough**: the Calendly JS snippet reads `window.location.search`.
-  Preview URLs won't have real UTMs; the snippet should no-op cleanly
-  (it already does — empty `queryString` branch handles it).
-
-**Multi-tenancy note:** when Webster is sold beyond Richie, the preview
-URL strategy stays per-client via their own CF Pages project. Each
-client's repo → CF Pages project → PR previews. Webster just needs to
-write the preview URL into `history/<week>/apply-log.json` after PR
-creation so the operator doesn't have to hunt for it.
-
-**Fallback:** if a client isn't on CF Pages / Vercel / Netlify, the apply
-PR falls back to "clone locally + serve" instructions in the PR body.
-Higher friction, usable.
-
-**Open:** none — this one is resolved.
-
----
-
-## Deferred to a later grill-me
-
-- Visual-design critic: standing (Opus-sample-to-ground-truth) vs.
-  spawn-each-week. Leaning standing.
-- Multi-site vs. single-site from day 1. Leaning single-site; multi-site
-  is a v2 week 4+ feature.
-- Trigger cadence (every merge vs. on-demand vs. weekly). Leaning weekly
-  plus on-demand override.
-- Review step composition — new code-focused `webster-code-reviewer`
-  critic vs. re-run the existing 5. Leaning re-run existing with ONE
-  new `apply-diff-reviewer` that's code-aware (current critics read
-  rendered HTML; apply reviewer reads diffs).
-- Iteration cap on review/fix loop. Default proposed: 3 loops, then
-  skip + annotate.
-
----
-
-## Operational intel for the next critic cycle
-
-From today's session — critic blind-spot finding:
-
-The conversion + seo critics both flagged CTAs as dead based on static
-greps for `acuityscheduling` / `href="#"`. Reality: CTAs wire via
-`data-calendly-base` + a JS snippet that rewrites `.href` at page load.
-The critics missed a runtime-wiring pattern.
-
-**Apply-worker implication:** Q2's headless-browser runtime check is
-partly motivated by this. The apply worker should catch the same class
-of error before opening a PR.
-
-**Critic-upgrade implication (separate from apply worker):** before v2
-week 2, update `agents/conversion-critic.json` and `agents/seo-critic.json`
-to include a static-analysis pass for:
-
-- `data-calendly-base`, `data-calendly`, `data-acuity`, `data-book-base`
-  style data-attr wiring patterns.
-- `class="booking-cta"` or similar CTA-flag class patterns + matching
-  `<script>` blocks that assign to `.href`.
-
-Any critic that greps for booking URLs should ALSO grep for
-runtime-rewrite patterns, or fall back to "inconclusive — recommend
-headless validation" rather than a false CRITICAL.
-
----
-
-## FEATURES.md translation (Phase 3 output preview)
-
-See `context/FEATURES.md` for the concrete #39a–e and #40a–d rows landed
-during Phase 3 of this session.
diff --git a/deploy/webster-dispatcher.plist b/deploy/webster-dispatcher.plist
deleted file mode 100644
index 3ce60d8..0000000
--- a/deploy/webster-dispatcher.plist
+++ /dev/null
@@ -1,48 +0,0 @@
-<?xml version="1.0" encoding="UTF-8"?>
-<!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
-<plist version="1.0">
-<dict>
-    <!--
-    Webster dispatcher liveness check.
-    Fires every 30 minutes. Checks if any forge workflows are active. If none AND
-    context/FEATURES.md has pending items, pops a macOS notification reminding Richie
-    to re-run `wbs`. Does NOT auto-start the dispatcher (which is interactive).
-
-    To install:
-      cp ~/Projects/webster/deploy/webster-dispatcher.plist ~/Library/LaunchAgents/com.richsak.webster.dispatcher.plist
-      launchctl load ~/Library/LaunchAgents/com.richsak.webster.dispatcher.plist
-
-    To uninstall:
-      launchctl unload ~/Library/LaunchAgents/com.richsak.webster.dispatcher.plist
-      rm ~/Library/LaunchAgents/com.richsak.webster.dispatcher.plist
-    -->
-    <key>Label</key>
-    <string>com.richsak.webster.dispatcher</string>
-
-    <key>ProgramArguments</key>
-    <array>
-        <string>/bin/zsh</string>
-        <string>-c</string>
-        <string>
-cd /Users/richiesakhon/Projects/webster
-active=$(~/.local/bin/forge isolation list 2>/dev/null | grep -c "^feat/\|^video/" || echo 0)
-pending=$(grep -c "^\- \[ \]" context/FEATURES.md 2>/dev/null || echo 0)
-if [ "$active" = "0" ] &amp;&amp; [ "$pending" -gt "0" ]; then
-    osascript -e "display notification \"$pending pending, 0 active. Run \\\"wbs\\\" to dispatch.\" with title \"Webster Dispatcher\" sound name \"Ping\""
-fi
-        </string>
-    </array>
-
-    <key>StartInterval</key>
-    <integer>1800</integer>
-
-    <key>StandardOutPath</key>
-    <string>/Users/richiesakhon/Projects/webster/tmp/logs/dispatcher-liveness.log</string>
-
-    <key>StandardErrorPath</key>
-    <string>/Users/richiesakhon/Projects/webster/tmp/logs/dispatcher-liveness.err</string>
-
-    <key>RunAtLoad</key>
-    <false/>
-</dict>
-</plist>
diff --git a/history/AGENTS.md b/history/AGENTS.md
deleted file mode 100644
index c9e4b51..0000000
--- a/history/AGENTS.md
+++ /dev/null
@@ -1,33 +0,0 @@
-# History artifacts — immutable
-
-> Runtime output lives here. Never edit, never delete, never regenerate.
-
-## What's in this directory
-
-- `history/<YYYY-MM-DD>/` — weekly production council runs (Nicolette's live business)
-- `history/demo-arc/` — pre-shipped 4-week demo arc seeder output
-- `history/secondary-arc/` — Pair Alpha (SaaS + local service) seeder output
-- `history/memory.jsonl` — event log read by planner + apply-worker + visual-reviewer
-- `history/baselines.jsonl` — per-experiment baselines
-
-## The rule
-
-If you think you need to modify something in here, **STOP and ask Richie**.
-
-Manipulating runtime artifacts destroys evidence the planner depends on for next-week decisions. It also breaks the auditability claim that underpins the verdict engine's `confidence` heuristic.
-
-## Hackathon expansion isolation
-
-The hackathon simulation writes to `demo-output/<substrate>/` — NOT under `history/`. Keep it that way. Isolation between production runtime artifacts and demo simulation output is a feature, not an accident.
-
-New sim output structure: `demo-output/landing-page/week-NN/...` and `demo-output/northwest-reno/week-NN/...`. See `context/EXPANSION-TASKS.md` T7–T9 for the asset-bundle contract.
-
-## When you genuinely need to change something here
-
-Reasons this is ever acceptable:
-
-- Richie explicitly instructs it
-- A schema migration of `memory.jsonl` or `baselines.jsonl` with an accompanying migration script + test
-- Adding a new week-dated directory via a production council run (via `prompts/second-wbs-session.md`, the normal path)
-
-Anything else: surface `[STUCK]` and ask.
diff --git a/history/CLAUDE.md b/history/CLAUDE.md
deleted file mode 120000
index 47dc3e3..0000000
--- a/history/CLAUDE.md
+++ /dev/null
@@ -1 +0,0 @@
-AGENTS.md
\ No newline at end of file
diff --git a/package.json b/package.json
index c165dfb..881e565 100644
--- a/package.json
+++ b/package.json
@@ -24,6 +24,9 @@
     "validate:agents": "bun scripts/validate-agents.ts",
     "validate:findings": "bun scripts/validate-findings.ts",
     "validate:md": "markdownlint-cli2",
+    "onboarding:verify-env": "bun scripts/onboarding/verify-env.ts",
+    "onboarding:verify-all": "bun scripts/onboarding/verify-all.ts",
+    "onboarding:scaffold-repo": "bun scripts/onboarding/scaffold-repo.ts",
     "validate": "bun run type-check && bun run lint --max-warnings 0 && bun run format:check && bun run validate:agents && bun run validate:findings && bun run validate:md && bun test",
     "test": "bun test",
     "prepare": "husky"
diff --git a/prompts/composition-session.md b/prompts/composition-session.md
deleted file mode 100644
index 5a49565..0000000
--- a/prompts/composition-session.md
+++ /dev/null
@@ -1,145 +0,0 @@
-# Composition session prompt — Webster hackathon demo video
-
-> Paste this into a fresh Claude Code session in the Webster repo. The session composes the final 90-second demo video for the Built with Opus 4.7 hackathon submission.
-
-## Mission
-
-You are running the video composition session for Webster's hackathon submission ("Built with Opus 4.7" by Anthropic × Cerebral Valley, deadline 2026-04-26).
-
-Your only job: assemble the final video per the locked spec. Do NOT redesign, re-grill, or improvise the video plan. Every beat is locked in `context/VIDEO-PLAN-90s.md` — your job is execution.
-
-## First actions (in order)
-
-1. Read `AGENTS.md` (operator guide, branch conventions, do/don't rules)
-2. Read `context/VIDEO-PLAN-90s.md` in full — canonical video spec for the 2026-04-26 submission cut. The 180s plan in `context/VIDEO-PLAN.md` is superseded; consult it only for tone/register reference.
-3. Read `context/VISION.md` (north-star context for any judgment calls)
-4. Confirm asset readiness (see `VIDEO-PLAN-90s.md` "Open dependencies" section)
-5. If any asset is missing or ambiguous: surface `[STUCK]` to Richie with specific paths/symptoms. Do NOT silently fall back to alternates without explicit approval.
-
-## Asset readiness checklist
-
-Confirm each of these exists before starting any composition work. If any is missing, stop and surface to Richie.
-
-### Sim assets (produced by T5–T10 implementation track)
-
-- [ ] `demo-output/lp/week-{1..10}/screenshots/{375,768,1440}/` — Richer Health LP screenshots, all 10 weeks, all 3 breakpoints
-- [ ] `demo-output/lp/week-{1..10}/manifest.json` — per-week sim manifest including veto flag
-- [ ] `demo-output/lp/week-{1..10}/analytics.json` — synthetic analytics per week (bounce rate, scroll depth, CTA per persona)
-- [ ] `demo-output/lp/week-{1..10}/findings/` — critic findings per week
-- [ ] `demo-output/site/week-{1..10}/` — same shape, Northwest Home Renovations substrate (3 pages: home, services, free-estimate)
-- [ ] `demo-output/genealogy-event.json` — captured `POST /v1/agents` request + 200 response from the actual organic spawn moment
-
-### Human-recorded assets (Richie produces separately)
-
-- [ ] `assets/nicolette-clip/` — raw multi-take footage from Nicolette interview (per Beat 1 interview guide in VIDEO-PLAN.md)
-- [ ] `assets/voiceover/` — Richie's VO takes for Beats 2/3/4/5/6 (per VO recording script in VIDEO-PLAN.md)
-- [ ] `assets/memory-stores-screenshots/` — Anthropic Console screenshots showing the 12 memory stores filling over time, with relative captions (Week 1 / Week 5 / Week 10)
-
-### Curated artifacts (you produce as part of composition prep)
-
-- [ ] `composition/best-finding.md` — single critic finding selected from `demo-output/lp/week-N/findings/` per Beat 2 Window 1 selection criteria (specific, short, demonstrates real judgment)
-- [ ] `composition/spawn-context.json` — extracted from `demo-output/genealogy-event.json` for Beat 2 Window 2
-
-## Tooling stack
-
-- **Claude Design** (claude.ai/design, Opus 4.7) — animated assets:
-  - Beat 2: council diagram (site at center, 5 critic nodes orbiting + redesigner + verifier, new node spawns) + 2 artifact windows (critic finding card UI + HTTP req/res viewer)
-  - Beat 3 + 4: animated bounce-rate line chart in corner, fed by analytics.json data
-  - Beat 5: composite Console-styled UI with genealogy tree growing animation
-  - Beat 6: final frame composition (Webster wordmark + "Built with Opus 4.7" lockup + GitHub URL + small QR)
-- **Forge Remotion** — final composition: stitches voiceover + Nicolette clip + Claude Design HTML + sim screenshots + transitions + music
-- **Screen recording** — fallback if Claude Design HTML doesn't embed cleanly via `<Html>` / `<IFrame>` in Remotion: screen-record the Claude Design output as MP4 and import as raw footage
-
-## Build order (sequential)
-
-### Phase 1 — Static asset prep (~1-2 hr)
-
-1. Select Beat 2 Window 1 critic finding from `demo-output/lp/week-N/findings/` per criteria in VIDEO-PLAN.md → write to `composition/best-finding.md`
-2. Extract Beat 2 Window 2 spawn artifact from `demo-output/genealogy-event.json` → write to `composition/spawn-context.json`
-3. Identify "first major redesign week" in LP timelapse (largest visual delta vs week 1) — this drives Beat 3 dwell timings. Write to `composition/lp-pacing.md`
-4. Identify same for site substrate → `composition/site-pacing.md`
-5. Identify the actual veto week per substrate (read manifest.json `veto: true` flag) → confirm matches what VO references; record alternate VO takes if veto landed on a different week
-
-### Phase 2 — Animated asset build in Claude Design (~3-5 hr)
-
-In claude.ai/design, build each animated asset per the visual choreography tables in VIDEO-PLAN.md:
-
-1. **Beat 2 council diagram** — animated structural diagram following Beat 2 visual choreography table
-   - Critic nodes use real spec names + role subtitles (`conversion-critic` / "Conversion", etc.)
-   - Spawn animation at the right moment in the timeline
-2. **Beat 2 Window 1** — finding card UI (use real text from `composition/best-finding.md`)
-3. **Beat 2 Window 2** — HTTP req/res viewer UI (use real bodies from `composition/spawn-context.json`)
-4. **Beat 3 + 4 bounce chart** — animated line chart, scrubs week-by-week from analytics.json
-5. **Beat 5 composite** — Console-styled UI + genealogy tree growing animation
-6. **Beat 6 final frame** — wordmark + lockup + URL + QR
-
-Export each as standalone HTML or screen-record as MP4. Decide per asset based on Remotion embedding feasibility.
-
-### Phase 3 — Composition in Forge Remotion (~3-5 hr)
-
-1. Set up Remotion project at composition target (1080p, 30fps, 90s — per the canonical `context/VIDEO-PLAN-90s.md`)
-2. Sequence beats: 1 → 2 → 3 → 4 → 5 → 6 with locked durations
-3. Embed Claude Design assets via `<Html>` / `<IFrame>` or imported MP4
-4. Layer voiceover audio synced to choreography tables
-5. Add music bed (low-volume under all beats except where VO carries)
-6. SFX stinger at Beat 5 spawn moment
-7. Transitions between beats: fade or crossfade per spec; do NOT use stylized transitions (slides, wipes) — they read as cheap
-
-### Phase 4 — Length check & drop pass (~30 min)
-
-1. Render preview at full quality
-2. Time the cut — must be ≤90s (the 180s plan is superseded)
-3. If overshoot: walk the per-beat drop-priority lists in VIDEO-PLAN.md mechanically. Drop item #1 from the most-overshot beat, recheck length, continue.
-4. If undershoot: do NOT pad. Submit short.
-
-### Phase 5 — Pre-submission gates (~30 min)
-
-Verify each:
-
-- [ ] Beat 5 narration matches actual spawn week from sim (substitute correct week if not "week eight")
-- [ ] Beat 5 spawn overlay shows actual spawned critic name (no placeholder `<critic-name>`)
-- [ ] Beat 3/4 veto callouts match actual veto weeks from sim manifests
-- [ ] All on-screen agent spec names match registered names (cross-check `agents/*.json`)
-- [ ] No fabricated stats (every number on screen sourced from real analytics.json or real Console)
-- [ ] Watch end-to-end at least once on a phone (most judges watch on phones)
-- [ ] Audio levels normalized (VO ≈ -16 LUFS, music bed -28 LUFS, no clipping)
-- [ ] No typos in tagline / URL / QR / on-screen text
-- [ ] GitHub URL renders correctly + QR scans correctly when filmed
-
-### Phase 6 — Submission
-
-1. Export final MP4 (1080p, H.264, AAC audio, ≤2GB)
-2. Upload to Cerebral Valley submission form
-3. Confirm video plays correctly on the form preview
-4. Submit
-
-## Escalation rules — when to surface `[STUCK]` to Richie
-
-Surface and STOP if any of these:
-
-1. Genealogy spawn never fired (sim ran 10 weeks + re-run, no spawn) — apply Beat 5 fallback rules per VIDEO-PLAN.md, but ASK Richie which fallback option (2a/2b/2c) before composing
-2. Cerebral Valley submission cap is shorter than the 90s cut (1:30) — escalate length cut decisions
-3. Asset missing that you can't produce yourself (e.g. Nicolette clip not recorded, VO not recorded)
-4. Claude Design output won't embed cleanly into Remotion AND screen-recording produces unacceptable quality
-5. Visual deltas across timelapse weeks are too small to register at 35s — Beat 3/4 may need pacing rebalance
-6. Any decision that requires choosing between two reasonable options and isn't in VIDEO-PLAN.md
-
-Do NOT surface for:
-
-- Routine production decisions (font choice, color tweaks, exact stinger sound)
-- Anything explicitly resolved in VIDEO-PLAN.md
-
-## Hard rules
-
-- Do NOT modify VIDEO-PLAN.md to make execution easier. If the spec is wrong, surface to Richie.
-- Do NOT add scope (extra beats, extended length, additional assets).
-- Do NOT improvise the spawned critic name or veto week — they're real artifacts from sim runs.
-- Do NOT use stock footage or AI-generated imagery in the final cut. Real screenshots only.
-- Do NOT skip the pre-submission gates. They're cheap; missing one is expensive.
-- Do NOT touch production agents, the production orchestrator, or anything in the existing 9 `webster-*` set during composition.
-
-## Output of the composition session
-
-Final deliverable: `composition/final.mp4` (1080p, H.264, ≤90s, ≤2GB) ready to upload to the Cerebral Valley submission form.
-
-Plus: `composition/changelog.md` — log of any deviations from VIDEO-PLAN.md, with rationale (should ideally be empty).
diff --git a/prompts/e2e-demo-run-session.md b/prompts/e2e-demo-run-session.md
deleted file mode 100644
index fb8b9d8..0000000
--- a/prompts/e2e-demo-run-session.md
+++ /dev/null
@@ -1,155 +0,0 @@
-# Webster E2E Demo Run Session
-
-## Mission
-
-Run the Webster end-to-end demo pipeline and produce the final handoff assets for video composition.
-
-This session is allowed to use Anthropic API tokens. Do not run this prompt in a token-restricted session.
-
-## Read first
-
-1. `AGENTS.md`
-2. `context/VISION.md`
-3. `context/EXPANSION-TASKS.md`
-4. `context/E2E-IMPLEMENTATION-TRACKER.md`
-5. `prompts/sim-runner.md`
-
-## Current prepared state
-
-- Core validation was green before this handoff: `bun run validate` → 181 tests passing.
-- Core preflight does not require browser Console auth:
-  - `bun run sim:preflight`
-- Manual Memory Stores screenshot already exists:
-  - `assets/memory-stores-screenshots/manual/console-memory-stores-2026-04-25.png`
-- Manual screenshot manifest already supports this proof path:
-  - `bun run sim:emit-manifest`
-- Auto-capture remains available but optional:
-  - strict mode: `WEBSTER_REQUIRE_CONSOLE_CAPTURE=1 bun run sim:preflight`
-  - bridge: `bun run sim:lp 2>&1 | bun run sim:capture-bridge`
-
-## Hard rules
-
-- Do not modify production agents.
-- Do not modify `prompts/second-wbs-session.md`.
-- Do not run both substrates in parallel.
-- Do not hide failures. If a council run fails repeatedly, stop and report `[STUCK]` with the failing command and last 40 lines.
-- Do not require Console screenshot auto-capture; manual proof is already present.
-
-## Recommended run path
-
-### 1. Confirm clean enough state
-
-```bash
-git status --short
-bun run validate
-bun run sim:preflight
-```
-
-If validation fails from unrelated formatting, fix formatting only and rerun. If tests fail, stop.
-
-### 2. Ensure provisioned API resources
-
-These use Anthropic API tokens and are expected in this session:
-
-```bash
-bun scripts/provision-memory-stores.ts
-bun scripts/register-sim-agents.ts
-```
-
-Expected outputs:
-
-- `context/memory-stores.json` contains 12 store IDs.
-- `context/sim-agents.json` contains 18 sim agent IDs.
-
-### 3. Run LP simulation
-
-Use the no-auto-capture path first:
-
-```bash
-bun run sim:lp
-```
-
-If Richie explicitly wants fresh Console milestone screenshots and is logged into Anthropic Console in Chrome profile `Default`, use:
-
-```bash
-bun run sim:lp 2>&1 | bun run sim:capture-bridge
-```
-
-### 4. Run site simulation
-
-```bash
-bun run sim:site
-```
-
-Optional auto-capture variant:
-
-```bash
-bun run sim:site 2>&1 | bun run sim:capture-bridge
-```
-
-### 5. Emit screenshot manifest
-
-```bash
-bun run sim:emit-manifest
-```
-
-This should include the manual screenshot under `manual_proof`. Auto week screenshots are optional unless `WEBSTER_REQUIRE_AUTO_MEMORY_SCREENSHOTS=1` is set.
-
-### 6. Build demo manifests and final sheets
-
-```bash
-bun scripts/build-demo-manifest.ts
-```
-
-Expected outputs:
-
-- `demo-output/landing-page/demo-manifest.json`
-- `demo-output/landing-page/final-sheet.png`
-- `demo-output/northwest-reno/demo-manifest.json`
-- `demo-output/northwest-reno/final-sheet.png`
-- `assets/memory-stores-screenshots/manifest.json`
-
-### 7. Inspect handoff assets
-
-Check visually and structurally:
-
-```bash
-find demo-output -maxdepth 3 -type f | sort | sed -n '1,120p'
-find assets/memory-stores-screenshots -maxdepth 3 -type f | sort
-```
-
-Manual inspection checklist:
-
-- Week 0 and week 10 screenshots exist for both substrates.
-- Final sheets are not blank.
-- LP and Northwest Reno visibly improve.
-- Genealogy outcome is documented honestly: spawn, no-spawn, or diagnosed rerun.
-- Memory proof screenshot exists and is referenced in manifest.
-
-### 8. Final validation
-
-```bash
-bun run validate
-```
-
-If green, report:
-
-- commands run
-- key output paths
-- whether genealogy spawned
-- final validation result
-- any assets still missing for video composition
-
-## If stuck
-
-Use this exact format:
-
-```text
-[STUCK] <short failure>
-Command: <command>
-Last output:
-<last 40 lines>
-What I tried:
-- ...
-Recommendation: <one direct next action with score/100>
-```
diff --git a/prompts/fourth-wbs-session.md b/prompts/fourth-wbs-session.md
deleted file mode 100644
index d5a9a66..0000000
--- a/prompts/fourth-wbs-session.md
+++ /dev/null
@@ -1,333 +0,0 @@
-# Fourth wbs session — deploy old/new LP + grill-me on v2
-
-> **Override default Operating Loop.** This is a polish + planning session. Do NOT scan `FEATURES.md` for the normal dispatch loop, do NOT launch feature workflows, do NOT create Anthropic managed-agent sessions. Execute the phases below end-to-end.
-
-## What this session does
-
-Two goals (Phases 1–2) followed by two short wrap-up phases (3–4), sequenced so Phase 1 (deploy) runs first — Richie can eyeball the old/new UI in his browser while Phase 2 (grill-me) is active.
-
-1. **Phase 1 — Fork + manual apply + local preview (~45 min).** Mirror `certified.richerhealth.ca` into `site/before/`, clone to `site/after/`, manually apply the 5 `history/2026-04-23/proposal.md` edits, start a local http server, output two URLs.
-2. **Phase 2 — Grill-me on v2 (~30 min).** Invoke the `grill-me` skill on the top-6 planning questions for features #39 (apply + review/fix loop) and #40 (image-gen tool). Output: `context/v2-design.md`.
-3. **Phase 3 — Translate decisions.** Update `FEATURES.md` Layer 8 with concrete sub-features derived from the grill-me outcome.
-4. **Phase 4 — Checkpoint.**
-
-**Expected runtime:** 75–90 min wall-clock (Phase 1 ~45, Phase 2 ~30, Phase 3–4 ~10).
-**Expected API cost:** ~$0 (Opus subscription; no managed-agent calls).
-
-## Pre-flight (MANDATORY — do not skip)
-
-```bash
-# 1. Working tree clean — we'll be creating files under site/
-if [[ -n $(git status --porcelain) ]]; then
-  echo "ABORT: working tree has uncommitted or untracked files."
-  git status --short
-  exit 1
-fi
-
-# 2. Tools required
-for tool in wget python3 jq gh git; do
-  command -v "$tool" >/dev/null 2>&1 || { echo "ABORT: $tool not installed"; exit 1; }
-done
-
-# 3. Operator-decision.json for last week exists (confirms session 3 ran)
-[[ -f history/2026-04-23/operator-decision.json ]] || {
-  echo "ABORT: history/2026-04-23/operator-decision.json missing."
-  echo "Run prompts/third-wbs-session.md first."
-  exit 1
-}
-
-# 4. Proposal source for manual edits exists
-[[ -f history/2026-04-23/proposal.md ]] || {
-  echo "ABORT: history/2026-04-23/proposal.md missing."
-  echo "Run prompts/third-wbs-session.md first or restore the proposal before applying edits."
-  exit 1
-}
-
-# 5. site/ should NOT already exist (this session creates it); bail if it does
-if [[ -d site/before || -d site/after ]]; then
-  echo "NOTE: site/before or site/after already exists."
-  echo "If this is a re-run, delete them first:  rm -rf site/"
-  exit 1
-fi
-
-mkdir -p site tmp .claude/checkpoints
-```
-
-## Phase 1 — Fork + manual apply + preview server
-
-### Step 1.1 — Mirror live LP into `site/before/` (~5 min)
-
-```bash
-cd site
-wget \
-  --mirror \
-  --convert-links \
-  --adjust-extension \
-  --page-requisites \
-  --no-parent \
-  --span-hosts \
-  --domains=certified.richerhealth.ca,richerhealth.ca \
-  --user-agent="Mozilla/5.0 (webster-fork)" \
-  -e robots=off \
-  -o ../tmp/wget-before.log \
-  https://certified.richerhealth.ca/ || {
-    echo "wget hit errors — inspect tmp/wget-before.log"
-  }
-
-# wget nests everything under certified.richerhealth.ca/; flatten into before/
-mv certified.richerhealth.ca before
-[[ -d richerhealth.ca ]] && mv richerhealth.ca before/_external-richerhealth.ca
-
-cd ..
-
-# Sanity check: must have an index.html
-[[ -f site/before/index.html ]] || {
-  echo "ABORT: wget did not produce site/before/index.html"
-  ls -la site/before/
-  exit 1
-}
-
-echo "── site/before rendered OK ──"
-du -sh site/before
-ls site/before/ | head -20
-```
-
-### Step 1.2 — Clone `before` → `after` (<1 min)
-
-```bash
-cp -R site/before site/after
-[[ -f site/after/index.html ]] || { echo "ABORT: copy failed"; exit 1; }
-echo "── site/after ready for edits ──"
-```
-
-### Step 1.3 — Apply the 5 proposal.md edits to `site/after/` (~30 min)
-
-**You (Opus 4.7) now perform the edits directly, using the `Read`/`Edit` tools against `site/after/index.html` (and any linked HTML files wget produced). Edit sources: `history/2026-04-23/proposal.md` Issues 1–5.**
-
-Apply order (surgical, one at a time, verify after each):
-
-1. **Issue 1 — CTA → Acuity.** Find every `<a … href="#"` that is a BOOK/CALL CTA. Replace `href="#"` with `href="https://app.acuityscheduling.com/schedule.php?owner=16697295"`, add `target="_blank"`, `rel="noopener"`, `data-cta="book-strategy-call"`. Standardise visible label to `BOOK YOUR FREE STRATEGY CALL`. **Expected count: 5 CTAs.** If you find more or fewer, stop and report — the live LP may have changed since the critics last read it.
-
-2. **Issue 2 — DSocSci + medical disclaimer.** In `site/after/index.html` find `FOUNDER & MASTER CLINICIAN` (or the `&amp;` variant) → replace with `FOUNDER, RICHER HEALTH`. Find `Dr. Nicolette Richer` in the founder section → replace with `Dr. Nicolette Richer, DSocSci`. Append the scope-note `<p>` block from proposal.md Issue 2 Change A immediately after the founder name. In footer, prepend the medical-disclaimer `<p>` from Issue 2 Change B. Replace footer `href="#"` links with `/privacy`, `/terms`, `/clinical-standards`, `mailto:hello@richerhealth.ca`.
-
-3. **Issue 3 — Hedge clinical-authority language.** Three replacements:
-   - `25 years reversing chronic disease…` → hedged version from Issue 3 Change A
-   - `Patients Treated` → `Clients Served`
-   - `Trained under Charlotte Gerson…` → first-person hedged version from Issue 3 Change C
-
-4. **Issue 4 — Hero H1 + subhead.** Find current H1 `YOUR PRACTICE. THEIR PLAYBOOK. PATIENTS NOTICE.` → replace with the N&D-keyword-bearing H1 from Issue 4. Replace the existing subhead `<p>` with the ICP-framed subhead.
-
-5. **Issue 5 — Head tag foundation.** In `<head>` of `site/after/index.html`: rewrite `<title>`, add meta description, canonical, OG tags, Twitter tags, JSON-LD block. Full HTML is in proposal.md Issue 5.
-
-   **Dependency**: `og-card.jpg` doesn't exist yet. Omit `og:image` and `twitter:image` meta tags until a valid asset exists. Do NOT ship broken image URLs in the meta.
-
-After each issue, run a smoke check:
-
-```bash
-# Count the change to confirm it landed
-grep -c "app.acuityscheduling.com" site/after/index.html   # expect ≥5 after Issue 1
-grep -c "DSocSci" site/after/index.html                     # expect ≥2 after Issue 2
-grep -c "Clients Served" site/after/index.html              # expect 1 after Issue 3
-grep -c "N&amp;D Team Certification" site/after/index.html  # expect ≥1 after Issue 4
-grep -c "application/ld+json" site/after/index.html         # expect 1 after Issue 5
-```
-
-If any count is 0, stop and diagnose — the rendered HTML may use different markup than proposal.md assumed.
-
-### Step 1.4 — Start preview server (background) (<1 min)
-
-```bash
-# Kill any previous server on 8080
-lsof -ti:8080 | xargs kill -9 2>/dev/null || true
-
-# Start server in background, pinned to repo root so both before/ and after/ serve
-nohup python3 -m http.server 8080 > tmp/http-server.log 2>&1 &
-disown
-sleep 1
-
-# Verify
-curl -sf http://localhost:8080/site/before/ >/dev/null && echo "  ✓ before reachable" \
-  || echo "  ✗ before NOT reachable — check tmp/http-server.log"
-curl -sf http://localhost:8080/site/after/ >/dev/null && echo "  ✓ after reachable" \
-  || echo "  ✗ after NOT reachable"
-
-echo ""
-echo "══════════════════════════════════════════════════"
-echo "Open in browser:"
-echo "  BEFORE: http://localhost:8080/site/before/"
-echo "  AFTER:  http://localhost:8080/site/after/"
-echo "══════════════════════════════════════════════════"
-```
-
-### Step 1.5 — Commit the fork + apply (optional; gate on Richie visual approval)
-
-**PAUSE.** Richie eyeballs both URLs. If anything is visibly broken (layout collapse, missing CSS, wrong content), fix before committing.
-
-Once Richie confirms visual parity and the `after` edits look correct:
-
-```bash
-git add site/
-git commit -m "feat(site): fork certified.richerhealth.ca + apply week 2026-04-23 proposal (manual apply)"
-git push origin main
-```
-
-Commit ends Phase 1.
-
----
-
-## Phase 2 — Grill-me on v2 features (interactive)
-
-**Invoke the `grill-me` skill with the question tree below.** Grill-me is an interview pattern — one question at a time, pressure-test Richie's answer, move on when an answer is sharp. Keep each exchange tight (no walls of text).
-
-### Question tree (top priority — must answer in this session)
-
-**Q1. Apply worker runtime.**
-Recommendation (75/100): Pi worker (Codex gpt-5.4) via a Forge workflow. Rationale: Pi is already Webster's worker-pool standard, Codex is good at structured code mutation, Forge gives us worktree isolation + validation. Alternatives: a Claude Opus managed agent (expensive, unnecessary), `claude -p` subscription (subscription burn, no isolation). Grill-me: press on why NOT Forge+Pi; surface concrete blockers.
-
-**Q2. Done-definition.**
-Recommendation (70/100): "Lint+type green" as a hard floor, PLUS re-running the 5 (or 6 with visual-design) council critics against the mutated code and requiring zero new CRITICAL/HIGH findings. Rationale: "green build" is necessary but not sufficient; re-running critics is the system's own quality signal. Alternatives: purely green-build (lower bar), add visual-regression snapshot (stronger but needs a Playwright infra layer). Grill-me: is visual-regression worth the infra cost, or overkill for weekly cadence?
-
-**Q3. #39 ↔ #40 (image-gen tool) dependency strength.**
-Recommendation (75/100): **Soft dependency.** #39 (apply worker) ships first and stubs image assets with `<!-- asset TBD: og-card -->` comments when encountered. #40 (image-gen tool — enumerated types `{og_card, icon, hero_bg, section_illustration}`, backend `gpt-image-1`) ships as a follow-up that the apply worker starts calling when available. Rationale: unblocks #39 from #40's planning tail (brand-guide schema, cost ceiling, persistence path); degrades gracefully when #40 is down. Alternatives: hard dependency (wait for #40 — delays #39; #40 is the more experimental feature), no dependency (operator fills assets manually forever — drift risk). Grill-me: is "stub + comment" acceptable for v2 week-1, or does the apply PR need to be complete-or-fail? Also: is the enumerated type list correct, or is something obvious missing (testimonial headshots? diagram illustrations?).
-
-**Q4. PR-format: one big PR vs. one per issue.**
-Recommendation (65/100): **One PR per issue** (or per issue-cluster if two issues touch the same file — e.g. Issues 2 + 3 both edit `FounderSection.astro`). Rationale: smaller PRs = easier review, partial-merge-ability (operator can merge Issue 1 and reject Issue 5 independently), clearer Git history. Tradeoff: more PR overhead (5x branches, 5x CI runs). Alternatives: one big PR (simpler automation, all-or-nothing merge). Grill-me: at what issue-count does "one per issue" become too noisy? (2? 5? 10?)
-
-**Q5. Failure fallback when apply can't land an issue.**
-Recommendation (70/100): **Skip + annotate.** If the apply worker can't apply an issue (string mismatch, layout conflict, merge impossible), skip that issue, log a structured annotation to `history/<week>/apply-log.json`, and continue. Do NOT fail the whole run on one skipped issue. Operator review sees the annotation and decides next steps. Rationale: partial progress > blocked-entirely. Alternatives: fail-fast (blocks other fixes for no reason), auto-escalate to Opus-4.7 human-in-loop (expensive, negates autonomy claim). Grill-me: should a CRITICAL-severity skipped issue block the PR from opening at all?
-
-**Q6. Preview URL strategy for the apply PR (how the operator reviews before merge).**
-Recommendation (80/100): **Use host-provided PR preview URLs.** If the production `certified.richerhealth.ca` repo is hosted on Cloudflare Pages / Vercel / Netlify, every PR auto-gets a preview URL like `pr-<n>.<project>.pages.dev` — operator reviews on that URL; zero interference with the production domain. Rationale: standard pattern, zero infra, no custom domain to maintain, disposable per PR. Alternatives: local-only (operator must `git checkout <pr-branch>` + serve locally — high friction for non-technical operators when Webster is sold beyond Richie), custom staging subdomain `staging.richerhealth.ca` (more setup, worth it only for long-lived staging), path-based on prod (`certified.richerhealth.ca/preview/` — BAD: same analytics/robots/origin, real visitors could land there). Grill-me: which host is the real Richer Health repo on today? If it's not on CF Pages / Vercel / Netlify, "wire up PR preview" becomes a prerequisite for #39 to be useful — call it #39f.
-
-### Deferred to a later grill-me (ack but don't resolve this session)
-
-- Visual-design-critic: standing vs. spawn-each-week
-- Multi-site vs. single-site from day 1
-- Trigger cadence (every merge vs. on-demand vs. weekly)
-- Review step composition (new code-reviewer agent vs. re-run critics)
-- Iteration cap (how many review/fix loops before bail)
-
-### Output format
-
-Grill-me writes answers to `context/v2-design.md` as it goes:
-
-```markdown
-# Webster v2 — Apply + Review/Fix Loop (design doc)
-
-> Captured from the Phase 2 grill-me session on 2026-04-23.
-> Feature entry: `FEATURES.md` #39.
-
-## Q1 — Apply worker runtime
-
-**Decision:** <Richie's answer>
-**Rationale:** <one line>
-**Open sub-questions:** <list if any>
-
-## Q2 — Done-definition
-
-…
-```
-
----
-
-## Phase 3 — Translate decisions into FEATURES.md
-
-Once Phase 2 concludes, translate the 6 Q&A outcomes into concrete Layer 8 sub-features. Replace the single "#39 NEEDS PLANNING" and "#40 NEEDS PLANNING" rows with decompositions like:
-
-**#39 apply worker sub-features** (from Q1, Q2, Q4, Q5, Q6):
-
-- #39a — Apply worker implementation (from Q1 — e.g. Pi Codex via Forge workflow)
-- #39b — Critic re-run gate + done-definition wiring (from Q2)
-- #39c — Per-issue PR emission + apply-log.json annotation (from Q4)
-- #39d — Skip+annotate fallback behaviour (from Q5)
-- #39e — Preview URL wiring (from Q6 — gates on host identification)
-
-**#40 image-gen tool sub-features** (from Q3):
-
-- #40a — Tool schema + enumerated type list (og_card, icon, hero_bg, section_illustration + any additions from Q3)
-- #40b — Backend wire-up (e.g. `gpt-image-1` client + retry + cost ceiling)
-- #40c — Brand-context input format + asset persistence path
-- #40d — #39 integration pattern (stub-when-absent, invoke-when-present per Q3 "soft dependency" decision)
-
-Assign `todo` status to each. Leave hours as estimate-after-grill-me.
-
-```bash
-# After editing FEATURES.md:
-git add context/FEATURES.md context/v2-design.md
-git commit -m "docs(v2): grill-me design doc + decomposed #39/#40 sub-features"
-git push origin main
-```
-
----
-
-## Phase 4 — Checkpoint + exit
-
-```bash
-CKPT=".claude/checkpoints/$(date -u +%Y-%m-%dT%H%M%SZ)-session-4-complete.md"
-cat > "$CKPT" <<EOF
----
-ts: $(date -u +%Y-%m-%dT%H:%M:%SZ)
-trigger: session-4-complete
----
-
-## What happened
-
-Session 4: forked certified.richerhealth.ca into site/before + site/after,
-manually applied week 2026-04-23 proposal to after, stood up local preview,
-grilled v2 apply+loop design in Phase 2, decomposed FEATURES.md #39.
-
-## Preview URLs (local only — kill http-server when done)
-
-- BEFORE: http://localhost:8080/site/before/
-- AFTER:  http://localhost:8080/site/after/
-
-## v2 decisions (see context/v2-design.md)
-
-- Q1 worker runtime: <filled in>
-- Q2 done-definition: <filled in>
-- Q3 #39↔#40 dependency strength: <filled in>
-- Q4 PR format: <filled in>
-- Q5 failure fallback: <filled in>
-- Q6 preview URL strategy: <filled in>
-
-## Next tick
-
-- Kill local http-server when done:  lsof -ti:8080 | xargs kill -9
-- Remaining submission-critical work:
-  - Cerebral Valley submission form (#37, Richie action)
-  - Demo video (Layer 6 — Richie voice record blocker)
-  - Bug fixes from session 2/3 (5 known)
-- Post-submission: build #39a–e per the decomposition.
-EOF
-echo "Checkpoint: $CKPT"
-```
-
-Checkpoints are gitignored by policy — do not add or commit this checkpoint file.
-
-```bash
-echo ""
-echo "══════════════════════════════════════════════════"
-echo "Session 4 complete."
-echo "  Site fork + apply:  site/before, site/after (committed)"
-echo "  v2 design doc:      context/v2-design.md (committed)"
-echo "  FEATURES Layer 8:   decomposed into #39a–e (committed)"
-echo "  Local preview:      http://localhost:8080/site/{before,after}/"
-echo "  Checkpoint:         $CKPT"
-echo "══════════════════════════════════════════════════"
-echo ""
-echo "Kill the preview server when done:  lsof -ti:8080 | xargs kill -9"
-exit 0
-```
-
-## If a step fails
-
-- **wget mirror incomplete / broken CSS in before/**: some LPs use CDN URLs that don't rewrite cleanly. Fallback: `curl -o site/before/index.html https://certified.richerhealth.ca/`, open in browser, accept that external CSS may break — the demo still shows the content structure even if styling is off.
-- **Apply edit: string not found**: the live LP may have changed since the critics last read it (24h+ old findings). Report the mismatch, ask Richie whether to force-apply via near-match or skip. Do NOT silently alter the edit.
-- **http.server port conflict**: change `8080` to `8081` throughout.
-- **Grill-me stalls on a question**: document the stall as an open sub-question, move to next Q. Don't force resolution on a question that's genuinely unresolved — pencil it in for the next grill-me.
-
-## What this prompt does NOT do
-
-- **Does not build the apply worker**. Phase 2 is planning, not implementation. Apply worker construction is a separate session after v2-design.md is signed off.
-- **Does not deploy to a public URL**. Preview is local-only. If Richie wants a public URL for the demo video, pipe `site/before/` + `site/after/` into a second session that wires Cloudflare Pages or `vercel --prod`.
-- **Does not modify existing council infrastructure**. The critic/redesigner/genealogy pipeline is frozen for submission.
diff --git a/prompts/sim-audit-fix-session.md b/prompts/sim-audit-fix-session.md
deleted file mode 100644
index 5d11b7d..0000000
--- a/prompts/sim-audit-fix-session.md
+++ /dev/null
@@ -1,311 +0,0 @@
-# Webster sim — audit, fix, dry-run E2E session (Pi/Forge)
-
-> Paste this whole file into a fresh Pi/Forge session. The mission is to find and fix every gap that caused the sim to silently no-op, then prove the pipeline works E2E via extensive dry runs **before** any wall-clock 10-week run.
->
-> **Token discipline is the whole point of this session.** Wall-clock spend on the broken pipeline so far: ~5 min, mostly idle polling. We are not doing another speculative run. Every API call after Phase 1 must be justified by a fix that earlier dry runs prove sound.
-
-## Mission
-
-Investigate, fix, and dry-run-verify the Webster simulation orchestrator (`prompts/sim-council.md` + `scripts/run-simulation.ts` + `scripts/run-simulation-{lp,site}.ts`) end-to-end so that a fresh Claude Code session can run `prompts/e2e-demo-run-session.md` and have it actually produce per-week site mutations, real screenshots that diverge across weeks, and meaningful Memory-Store summaries.
-
-Hackathon submission deadline is **2026-04-26**. Do not destroy any existing artifact in `assets/memory-stores-screenshots/manual/` or in `history/lp-demo/` / `history/site-demo/`.
-
-## Background — what we already know (do not re-discover this; verify only)
-
-Three cascading architectural gaps were diagnosed in the chat session immediately preceding this Forge run. Evidence is preserved at `/tmp/webster-sim/STUCK-REPORT.md` and at `/tmp/session-events.json` (full week-0 LP monitor session events).
-
-1. **`vault_ids` missing from `sim-council.md` `create_session()`** (lines ~91–109). Production at `prompts/second-wbs-session.md:102` defines `VAULT_ID="vlt_011CaLe2pEofWQptxQyV4UMd"` and passes it on session POST. The sim fork dropped this. Direct evidence: pulled session events show first event is `mcp_authentication_failed_error: "no credential is stored for this server URL"`. Agent then fell back to local `read` tool which errored on every path because the cloud sandbox has no working tree.
-
-2. **Demo branches local-only.** `git ls-remote --heads origin 'demo-sim-lp/*'` returns nothing. `scripts/run-simulation.ts` commits but does not push. Even with vault_ids attached, GitHub MCP `get_file_contents at ref=demo-sim-lp/w00` would 404 on `richsak/webster`.
-
-3. **Ugly-site working-tree mods never committed.** `demo-landing-page/ugly/*` and `demo-sites/northwest-reno/ugly/*` show as `M` in working tree but `run-simulation.ts` only stages `historyDir`/`outputWeekDir`. Even after gaps 1+2 are fixed, agents would read stale pre-modification content from the remote.
-
-4. **Bonus suspected gap — no apply step.** `sim-council.md` Step 5 (redesigner) sends a base-message and polls until idle, but never reads output events back or applies HTML mutations to the site. Production's `second-wbs-session.md` is presumed to have an apply step; the fork dropped it. **Phase 1 reviewers must confirm or refute this.**
-
-There may be additional gaps. The 3-reviewer audit in Phase 1 exists to enumerate them before any fix is committed.
-
-## Hard rules
-
-- Do not run any sim (`bun run sim:lp`, `bun run sim:site`, `bun scripts/run-simulation*.ts`) outside the explicit dry-run steps in Phase 4.
-- Do not modify production agents (`agents/webster-{monitor,planner,redesigner,visual-reviewer}.json`, `agents/{seo,brand-voice,fh-compliance,conversion,copy}-critic.json`).
-- Do not modify `prompts/second-wbs-session.md`. Read it freely; never write.
-- Do not skip the Phase-2 user-plan gate. Richie reads and approves the plan before any implementation begins.
-- Do not push to `main`. Work happens on a feature branch off `dev`. PR base is `dev`.
-- Do not bypass any pre-commit hook (`--no-verify`, `--no-gpg-sign`).
-- Do not bury failures. If a dry run produces output that looks suspicious (e.g. completes too fast, identical screenshots across weeks), stop and surface it. Speed of completion is a diagnostic signal.
-- Token-burn budget for this whole Forge session: **<= $20 of API spend**. If a fix design pushes you above that on the dry runs alone, surface and ask before continuing.
-
-## Phase 0 — Pre-flight (zero API spend)
-
-```bash
-git status --short
-git rev-parse --abbrev-ref HEAD
-bun run validate
-bun run sim:preflight
-git ls-remote --heads origin 'demo-sim-lp/*' 'demo-sim-site/*'
-ls assets/memory-stores-screenshots/manual/
-cat /tmp/webster-sim/STUCK-REPORT.md  # if it still exists
-```
-
-Expected: validate green, preflight green, ls-remote empty, manual PNG present. If any of these unexpectedly fail or unexpectedly pass (i.e. branches ARE on remote — that would change the diagnosis), pause and investigate before Phase 1.
-
-Create a worktree for this work:
-
-```bash
-git worktree add ../webster-sim-fix dev -b fix/sim-orchestrator-gaps
-cd ../webster-sim-fix
-```
-
-All subsequent work happens in the worktree.
-
-## Phase 1 — 3 parallel reviewer agents (no fixes, no API calls to Anthropic from inside the reviewers)
-
-Spawn three reviewer subagents IN PARALLEL. Each one reads code only and reports back. None of them executes the simulation. None of them calls the Anthropic API.
-
-### Reviewer A — Production-vs-sim diff (GPT-5.5, low reasoning)
-
-Focus: enumerate every architectural divergence between production and sim orchestrators.
-
-Inputs to read:
-
-- `prompts/second-wbs-session.md` (full)
-- `prompts/sim-council.md` (full)
-- `scripts/run-simulation.ts`
-- `scripts/run-simulation-lp.ts`
-- `scripts/run-simulation-site.ts`
-- `scripts/critic-genealogy.ts`
-- `scripts/apply-worker.ts` (if present)
-- `scripts/apply-worker-cli.ts` (if present)
-
-Output a markdown table:
-
-| Step | Production behavior | Sim behavior | Gap | Risk         |
-| ---- | ------------------- | ------------ | --- | ------------ |
-| ...  | ...                 | ...          | ... | low/med/high |
-
-Specifically confirm/refute:
-
-- vault_ids inclusion in session POST body (already known gap; confirm fix shape)
-- redesigner apply step (suspected gap; trace where production reads output events and produces a commit, and whether the same hook exists in sim)
-- visual-reviewer screenshot ingestion (does prod actually receive the screenshots? how?)
-- genealogy spawn invocation (where does prod call `critic-genealogy.ts` and with what inputs?)
-- memory-store write timing (does prod write summaries pre/post council? sim does post — is that right?)
-- monitor/critic findings persistence (prod commits findings via GitHub MCP `create_or_update_file`; does sim do the same?)
-
-Hard limit: read-only. Do not write any file. Do not call any API.
-
-### Reviewer B — Data lifecycle audit (GPT-5.5, low reasoning)
-
-Focus: trace every file in the simulation's data lifecycle from ugly source → final timelapse asset.
-
-Inputs to read:
-
-- `scripts/run-simulation.ts`
-- `scripts/run-simulation-{lp,site}.ts`
-- `prompts/sim-council.md`
-- `scripts/synthetic-analytics.ts` and `scripts/analytics-ingestion.ts`
-- `scripts/build-demo-manifest.ts`
-- `agents/webster-lp-sim-*.json` (read each system prompt — note any path or ref the agent expects)
-- `demo-landing-page/ugly/`, `demo-landing-page/context/` (just `ls -R`, do not read every file)
-- `demo-sites/northwest-reno/ugly/`, `demo-sites/northwest-reno/context/` (same)
-
-For every file in the data flow, report:
-
-- **Producer**: what writes it
-- **Consumers**: what reads it (script, agent, downstream artifact)
-- **Persistence**: working tree only / committed / pushed to remote
-- **Per-week reset**: does it get overwritten each week? appended? immutable?
-- **Risk**: missing-input scenarios, stale-content scenarios, race conditions
-
-Specifically trace:
-
-- `demo-landing-page/ugly/index.html` → who writes it, who commits it, who pushes it, who reads it via MCP, when does it become the input to week N council
-- redesigner-proposed HTML → where does it land (event log? committed file? PR?)
-- weekly screenshots → producer (Playwright via `captureScreenshots`), consumer (week-summary, build-demo-manifest, video composition session)
-- `history/{lp,site}-demo/w<NN>/analytics.json` → producer (synthetic-analytics), consumer (council session via base_message reference, ingestion?)
-- memory-store writes → producer (`writeMemorySummary` in run-simulation.ts), consumer (next-week planner via `attach`)
-
-Hard limit: read-only.
-
-### Reviewer C — Token-spend trap audit (GPT-5.5, x-high reasoning)
-
-Focus: find every place in the pipeline where API tokens can be burned without producing useful artifacts. The previous run's 3:21 completion across 11×9 sessions is the reference failure.
-
-Inputs to read:
-
-- `scripts/run-simulation.ts`
-- `prompts/sim-council.md`
-- `scripts/synthetic-analytics.ts`
-- All sim-agent JSONs under `agents/webster-{lp,site}-sim-*.json` — read system prompts in full; the system prompt's instruction set is what determines if the agent will attempt useless work when its inputs are unavailable
-- `environments/webster-council-env.json`
-- `scripts/critic-genealogy.ts`
-
-Report each token-trap with:
-
-- **Trap location**: file:line
-- **Failure mode**: what makes the API call happen with no productive output
-- **Detection signal**: what an honest pipeline would see/log when this trap fires (so a fix can add a fail-fast guard)
-- **Cost upper bound**: per-week API spend if this trap fires for every session, every week
-- **Suggested guard**: smallest viable check that would cause the pipeline to halt rather than spin
-
-Specifically reason about:
-
-- Session creation that proceeds even though `vault_ids` is missing → entire 9-session council burns tokens for nothing every week, every substrate. (Already known. Confirm fix-side guard: `create_session` should refuse to POST if `vault_ids` is empty AND any agent's system prompt references GitHub MCP.)
-- `poll_idle` accepting an `idle` status without checking whether the session produced ANY agent output events. Right now `idle` after a `session.error` is treated as success. Suggest a minimum-events threshold or an explicit "did the agent emit at least one tool_use?" check.
-- Synthetic-analytics agent calls — `requestOpusReview` in `run-simulation.ts:272`: how does this fail? Does it have its own token-trap?
-- Memory-store writes via REST API: do they cost? are they per-week?
-- Genealogy probe vs spawn: spawn is a `POST /v1/agents` (free) but the genealogy _decision_ may invoke an Opus session — confirm cost shape.
-- `bun run validate` is invoked from inside the pre-commit hook every week; does that itself trigger any API call? (It shouldn't, but trust nothing.)
-
-Also include a one-line **suspicious-completion heuristic** the wrapper could add: e.g. "wall-clock per-week elapsed < 60s implies no real council work; halt and surface". Even one such heuristic would have caught both of yesterday's runs in the first week.
-
-Hard limit: read-only.
-
-### Phase 1 deliverable
-
-Three reviewer reports merged into a single file at `context/sim-audit/phase1-findings.md` in the worktree. Format:
-
-```markdown
-# Sim audit — Phase 1 findings (3-reviewer)
-
-## Confirmed gaps (cross-reviewer agreement, must-fix)
-
-- ...
-
-## Suspected gaps (one reviewer flagged, needs verification)
-
-- ...
-
-## Token traps with suggested guards
-
-- ...
-
-## Out-of-scope notes
-
-- ...
-```
-
-## Phase 2 — Consolidated plan (user gate)
-
-Read `context/sim-audit/phase1-findings.md`. Author `context/sim-audit/phase2-plan.md` containing:
-
-1. **Fix list, ordered**, each with: file path(s), one-line summary of change, justification, dry-run that proves it works.
-2. **Risk assessment**: what fixes touch shared code (`scripts/run-simulation.ts`) vs sim-only (`prompts/sim-council.md`). Anything that touches shared code needs a "does production still work?" answer.
-3. **Estimated API spend** for Phase 4 dry runs (with breakdown).
-4. **Open questions** that Richie must answer before implementation.
-
-Then surface to Richie:
-
-```text
-[PLAN READY] context/sim-audit/phase2-plan.md
-Estimated dry-run spend: $<X>
-Open questions: <Y>
-Awaiting approval before Phase 3.
-```
-
-**Do not begin Phase 3 until Richie acknowledges the plan.** If a Forge runtime auto-approves, surface a `[STUCK: AWAITING USER PLAN APPROVAL]` instead.
-
-## Phase 3 — Implementation
-
-Apply fixes from `phase2-plan.md` in dependency order. One conventional commit per fix or one small bundled commit per group, per `AGENTS.md` git rules.
-
-Hard requirements:
-
-- Every commit passes `bun run validate`.
-- Every fix has a unit test added or updated. No fix is "tested by the dry run" alone.
-- Pushing demo branches: introduce push step in `run-simulation.ts` or a wrapper. Use the `gh` CLI authenticated to `richsak/webster` (verify this remote exists before depending on it).
-- Committing the ugly-site working-tree mods: do this as a clean separate commit on `dev` BEFORE any sim run, so the demo branches are based off a HEAD that contains the ugly content. The commit message should clarify these are the demo-substrate ugly baselines, not Nicolette-production state.
-- vault_ids fix in `sim-council.md`: include it in `create_session()` AND add a guard that errors loudly if `vault_ids` is empty.
-
-Do not invent fixes outside the Phase-2 plan. If you discover a new issue mid-implementation, surface it back to Richie rather than silently expanding scope.
-
-## Phase 4 — Extensive dry runs
-
-Each dry run is gated on the previous one passing. Stop at the first failure; do not roll forward.
-
-### 4.1 — Mocked sim end-to-end (zero API spend)
-
-Use the existing `WEBSTER_SIM_COUNCIL_CMD` env var (already supported in `scripts/run-simulation-lp.ts`) to point at a stub script that:
-
-- Echoes a fake council session ID
-- Writes synthetic-shaped output files where the real council would
-- Returns exit 0
-
-Run the LP sim end-to-end with this stub. Verify:
-
-- All 11 weeks complete
-- Each week's branch contains the expected files
-- Branches push successfully (use a sandbox remote like `richsak/webster-sim-dryrun` if you want to avoid polluting `richsak/webster`)
-- `bun scripts/build-demo-manifest.ts` runs cleanly on the output
-- Final `bun run validate` is green
-
-Cost: $0 (no Anthropic calls).
-
-### 4.2 — One-week LIVE dry run for one substrate (~$5–15)
-
-Run `bun run sim:lp` configured to run **only week 0**. Verify:
-
-- Wall-clock duration > 90s (anything under 60s is the failure signal)
-- Session events for the LP monitor contain >= 5 events including >= 1 `agent.message`, >= 1 `agent.tool_use`, and >= 1 successful `mcp_tool_result`
-- The redesigner session produces at least one apply-step output
-- The committed `demo-sim-lp/w00` HEAD diff vs base shows redesigner-driven file changes (not just history/screenshots)
-- Memory store contents grew (compare via API: total bytes or document count up vs before)
-
-Halt and surface immediately if any check fails.
-
-### 4.3 — Two-week LIVE dry run, BOTH substrates sequential (~$20–40)
-
-Only run if 4.2 fully passes. Run LP weeks 0–1, then site weeks 0–1.
-
-Verify:
-
-- Site state diverges between week 0 and week 1 for each substrate (HTML diff non-empty)
-- Memory-store summaries from week 0 actually inform week 1 (planner session for week 1 should reference week 0 findings; check session events)
-- Both substrates' demo branches push to the appropriate remote
-- `build-demo-manifest.ts` produces a valid manifest
-
-If any check fails: halt, capture evidence (session IDs, branch names, event payloads), and surface a fix recommendation. Do not roll forward to a 10-week run.
-
-### 4.4 — Decision gate
-
-If 4.1–4.3 all pass:
-
-- Write `context/sim-audit/phase4-greenlight.md` summarizing the dry-run evidence
-- Surface `[GREENLIGHT] Phase 4 complete. E2E pipeline verified for 1–2 week runs. Ready for Richie to invoke prompts/e2e-demo-run-session.md in a fresh Claude Code session for the full 10-week run.`
-
-If anything fails: do not auto-loop into more attempts. Surface a `[STUCK]` with the failing check, the evidence, and a one-line recommendation.
-
-## Acceptance criteria
-
-This Forge session is done when **all** of the following are true:
-
-- [ ] `context/sim-audit/phase1-findings.md` exists with 3-reviewer cross-confirmed findings
-- [ ] `context/sim-audit/phase2-plan.md` exists and was approved by Richie
-- [ ] All Phase-3 fixes are committed on a single feature branch off `dev`
-- [ ] `bun run validate` is green on the feature branch
-- [ ] `context/sim-audit/phase4-greenlight.md` documents passing dry runs at 4.1, 4.2, and 4.3
-- [ ] A PR is open against `dev` titled `fix: webster sim orchestrator E2E gaps` with a description that summarizes the 3 known gaps + any reviewer-discovered ones
-- [ ] No commits on `main`. No edits to `prompts/second-wbs-session.md` or production agents.
-
-## Handoff to Richie's Claude Code session
-
-When Phase 4 greenlights:
-
-1. Confirm PR is open and CI is green
-2. Surface the PR URL and the 1–2 line "what to do next" instruction:
-   ``Ready: in your Claude Code session, run `/clear` then attach `prompts/e2e-demo-run-session.md`. The pipeline now does real council work; expect 30–60 min per substrate.``
-3. Save final state log at `context/sim-audit/handoff.md` with: PR URL, dry-run evidence summary, list of files changed, list of files explicitly NOT changed.
-
-## STUCK protocol
-
-If you reach a point that this prompt does not answer or where the next safe action is unclear:
-
-```text
-[STUCK] <one-line>
-Phase: <0|1|2|3|4>
-Evidence: <paths or session IDs>
-What I tried: ...
-What I need from Richie: <one specific question>
-```
-
-Do not paper over. Visible struggle is the contract.
diff --git a/prompts/sim-runner.md b/prompts/sim-runner.md
deleted file mode 100644
index de5b381..0000000
--- a/prompts/sim-runner.md
+++ /dev/null
@@ -1,187 +0,0 @@
-# Sim runner session prompt — automated sim + Console capture pipeline
-
-> Paste this into a fresh Pi (Forge worker) or Claude Code session ready to run the Webster simulation across both substrates with auto-capture of Anthropic Console memory store states. The output of this session is the asset bundle that the composition session and Beat 5 of the demo video depend on.
-
-## Mission
-
-You are running the simulation + capture pipeline for the Webster hackathon demo (deadline 2026-04-28).
-
-Your job: execute the full 10-week simulation across both substrates (Richer Health LP + Northwest Home Renovations site) and auto-capture Anthropic Console memory store screenshots at week 1, 5, and 10 for each substrate.
-
-**Do NOT** improvise, redesign critic specs, alter the council orchestrator, or modify the simulation scripts. Every parameter is locked in `context/VISION.md`, `context/EXPANSION-TASKS.md` (T7 + T8), and `context/ONBOARDING-CASE-STUDY.md` (Memory Stores capture plan).
-
-## First actions (in order)
-
-1. Read `AGENTS.md` (operator guide, branch conventions, do/don't rules)
-2. Read `context/EXPANSION-TASKS.md` — confirm T7 (sim wrapper) and T8 (per-substrate invocations) acceptance criteria
-3. Read `context/ONBOARDING-CASE-STUDY.md` "Memory Stores capture plan" section — capture protocol and targets
-4. Read `context/VIDEO-PLAN.md` Beat 5 section — confirm what the captures feed
-5. Confirm asset readiness checklist below
-6. Run pre-flight gate
-7. If anything is missing or ambiguous: surface `[STUCK]` to Richie with specific paths/symptoms. Do NOT silently fall back.
-
-## Asset readiness checklist
-
-Confirm each before kicking off the pipeline:
-
-### Code
-
-- [ ] `scripts/run-simulation-lp.ts` exists, builds, emits `CAPTURE_TRIGGER` events at weeks 1/5/10
-- [ ] `scripts/run-simulation-site.ts` exists, builds, emits `CAPTURE_TRIGGER` events at weeks 1/5/10
-- [ ] `scripts/capture-mem-stores.ts` exists, builds, accepts `{substrate, week, output}` arguments
-- [ ] `scripts/simulation-core.ts` exists with shared loop + trigger emission helper
-- [ ] All 18 sim agents registered in workspace (`webster-lp-sim-*` × 9, `webster-site-sim-*` × 9) — verify via `GET /v1/agents`
-- [ ] All 12 memory stores provisioned per `context/memory-stores.json` — verify via `GET /v1/memory_stores`
-
-### Auth + tooling
-
-- [ ] Anthropic API key with managed-agent + memory-store quota present in `.env.local`
-- [ ] GitHub PAT with repo scope present
-- [ ] `browser-use` CLI installed (`browser-use doctor` passes)
-- [ ] User's local Chrome "Default" profile logged into `console.anthropic.com` — `browser-use --profile "Default"` will reuse this session, no separate auth setup needed
-- [ ] One manual dry run: `browser-use --profile "Default" open https://console.anthropic.com/settings/memory-stores && browser-use screenshot /tmp/dryrun.png` — confirm the captured PNG shows the authenticated store list, not a login page
-
-### Output dirs
-
-- [ ] `assets/memory-stores-screenshots/lp/` (created on first run)
-- [ ] `assets/memory-stores-screenshots/site/` (created on first run)
-- [ ] `demo-output/lp/week-{1..10}/` (sim outputs land here)
-- [ ] `demo-output/site/week-{1..10}/` (sim outputs land here)
-
-## Pre-flight gate
-
-Before running either sim:
-
-```bash
-bun run sim:preflight
-# checks: agent count = 18, memory store count = 12, Console reachable, scripts compile
-```
-
-If preflight fails: stop. Surface the failure to Richie. Do not run the sim.
-
-## Pipeline phases
-
-### Phase 1 — LP substrate (Richer Health)
-
-```bash
-bun run sim:lp 2>&1 | bun run sim:capture-bridge
-```
-
-`sim:lp` runs `scripts/run-simulation-lp.ts`. The bridge script reads stdout JSON lines, spots `CAPTURE_TRIGGER` events, and spawns `scripts/capture-mem-stores.ts` for each.
-
-Expected sequence per week (1 through 10):
-
-1. Synthetic analytics agent fires (week N analytics generated)
-2. Sim spawns council session via `prompts/sim-council.md` for week N
-3. Council completes, screenshots/findings/manifests written to `demo-output/lp/week-N/`
-4. **At weeks 1, 5, 10 only**: sim emits a `CAPTURE_TRIGGER` JSON line to stdout
-5. Bridge reads trigger, spawns capture subprocess, waits for exit 0
-6. Sim moves to week N+1
-
-Total expected duration: 30–60 min per substrate (depends on session token volume).
-
-### Phase 2 — Site substrate (Northwest Home Renovations)
-
-Same shape:
-
-```bash
-bun run sim:site 2>&1 | bun run sim:capture-bridge
-```
-
-### Phase 3 — Manifest emit
-
-```bash
-bun run sim:emit-manifest
-# writes assets/memory-stores-screenshots/manifest.json
-# writes demo-output/lp/manifest.json (consolidating per-week manifests)
-# writes demo-output/site/manifest.json (consolidating per-week manifests)
-```
-
-The manifest is what the composition session reads to drive Beat 5 of the demo video.
-
-## Trigger protocol (the contract between sim and capture)
-
-Sim emits exactly one stdout JSON line per capture event:
-
-```jsonc
-{
-  "event": "CAPTURE_TRIGGER",
-  "substrate": "lp", // or "site"
-  "week": 5, // 1, 5, or 10
-  "output": "assets/memory-stores-screenshots/lp/week-5.png",
-  "console_url": "https://console.anthropic.com/settings/memory-stores",
-}
-```
-
-Bridge script behavior:
-
-- Reads stdin line-by-line; pipes each line through unchanged to its own stdout (so sim logs remain visible)
-- For lines parseable as `{"event":"CAPTURE_TRIGGER",...}`: spawn `scripts/capture-mem-stores.ts` with the trigger payload, wait for exit
-- If capture exits non-zero: print the failure, do not advance, halt the pipe (sim stalls — better than corrupt screenshots)
-
-## Capture subprocess (`scripts/capture-mem-stores.ts`)
-
-The TS script shells out to the `browser-use` CLI (it does NOT call any Claude-session-only skill). Sequence:
-
-```bash
-browser-use --profile "Default" open <console_url_from_trigger>
-browser-use wait selector "[data-testid='memory-stores-list']" --timeout 15000
-browser-use screenshot --full <output_path_from_trigger>
-```
-
-The `--profile "Default"` flag points `browser-use` at the user's real Chrome profile, so the existing logged-in Anthropic Console session is reused. No separate auth setup is needed.
-
-After the screenshot is written:
-
-1. Verify the file exists and is non-empty (`stat <output>`)
-2. Verify it doesn't appear to be a login page — quick heuristic: file size > 100KB AND `browser-use get text` for the page contains the phrase "Memory Stores"
-3. Exit 0 if both checks pass
-
-If the screenshot turns out to be a login page (auth expired): exit non-zero with a clear `AUTH_EXPIRED` marker on stderr. The bridge surfaces this and the pipeline halts; the user re-logs in via Chrome (no special tooling — just visit `console.anthropic.com` and sign in), and the pipeline is then resumed via the resume hook. Phases 1 + 2 are idempotent at per-week granularity: on resume, check whether `demo-output/{substrate}/week-N/manifest.json` exists and skip that week if so.
-
-## Escalation rules — when to surface `[STUCK]`
-
-Stop and surface if any of these:
-
-1. Preflight fails (agent or memory store count mismatch, scripts don't compile, Console unreachable)
-2. Any sim week's session fails repeatedly (3+ retry attempts) — diagnose root cause; do not paper over
-3. Capture subprocess fails with `AUTH_EXPIRED` — pause, ask Richie to re-login, then resume
-4. Capture subprocess fails for any other reason after 2 retries — surface immediately
-5. Sim completes but a milestone screenshot is missing — pipeline failed silently somewhere; surface
-6. Decision required that isn't covered by `context/VISION.md`, `EXPANSION-TASKS.md`, or `ONBOARDING-CASE-STUDY.md`
-
-Do NOT surface for:
-
-- Routine session retries within the council orchestrator (its own retry policy handles those)
-- Non-milestone weeks (no capture expected at weeks 2, 3, 4, 6, 7, 8, 9 — by design)
-
-## Hard rules
-
-- Do NOT modify the sim scripts, council orchestrator, or critic specs to "fix" issues mid-run. If something is broken, surface and stop.
-- Do NOT skip a milestone capture. If week 5 capture fails, halt — week 5 is required for Beat 5.
-- Do NOT manually screenshot Console as a fallback during the run. If auto-capture fails, the pipeline must be fixed and re-run from the failing week, not patched up.
-- Do NOT touch production agents, the production orchestrator (`prompts/second-wbs-session.md`), or anything in the existing 9 `webster-*` set.
-- Do NOT run both substrates in parallel. The `browser-use` CLI drives a single browser context; concurrent captures will collide.
-
-## Output of the pipeline
-
-| path                                                      | contents                                                                                                                            |
-| --------------------------------------------------------- | ----------------------------------------------------------------------------------------------------------------------------------- |
-| `demo-output/lp/week-{1..10}/`                            | per-week sim outputs (screenshots, findings, manifests, analytics, council reasoning)                                               |
-| `demo-output/site/week-{1..10}/`                          | same for site substrate                                                                                                             |
-| `assets/memory-stores-screenshots/lp/week-{1,5,10}.png`   | 3 PNG for LP Console captures                                                                                                       |
-| `assets/memory-stores-screenshots/site/week-{1,5,10}.png` | 3 PNG for site Console captures                                                                                                     |
-| `assets/memory-stores-screenshots/manifest.json`          | one-line manifest for composition                                                                                                   |
-| `demo-output/lp/manifest.json`                            | consolidated per-week manifest for LP                                                                                               |
-| `demo-output/site/manifest.json`                          | consolidated per-week manifest for site                                                                                             |
-| `demo-output/genealogy-event.json`                        | captured POST /v1/agents request + 200 response from the organic spawn moment (whichever substrate fires; if both fire, both saved) |
-
-These are the inputs the composition session (`prompts/composition-session.md`) consumes.
-
-## When in doubt
-
-- Sim semantics → `context/VISION.md` + `context/EXPANSION-TASKS.md` T7/T8
-- Capture protocol → this file's "Trigger protocol" + "Capture subprocess" sections
-- Beat 5 target → `context/VIDEO-PLAN.md` Beat 5
-- Onboarding skill ↔ this pipeline relationship → `context/ONBOARDING-CASE-STUDY.md` "Memory Stores capture plan"
-- Anything else → surface `[STUCK]` to Richie. Do not guess.
diff --git a/prompts/third-wbs-session.md b/prompts/third-wbs-session.md
deleted file mode 100644
index 859ea10..0000000
--- a/prompts/third-wbs-session.md
+++ /dev/null
@@ -1,308 +0,0 @@
-# Third wbs session — operator review: decide & record
-
-> **Override default Operating Loop.** This is a review session. Do NOT scan `FEATURES.md`, do NOT launch feature workflows, do NOT create Anthropic managed-agent sessions. Execute the steps below end-to-end.
-
-## What this session does
-
-Closes the loop on the most recent council PR. The second session produced a draft PR; this session is the operator decision gate.
-
-1. Finds the oldest open draft PR on a `council/<date>` branch.
-2. Pulls the branch and verifies `proposal.md` + `decision.json` (+ any genealogy spawn).
-3. Opus 4.7 (you, in this session) reads the artifacts and presents an operator-facing review — summary, strengths, risks, three scored options.
-4. **Pauses** for the operator's decision: `merge` / `reject` / `defer` + a 1-sentence rationale.
-5. Writes `history/$WEEK_DATE/operator-decision.json` — the durable record that feeds next week's monitor ("last week's proposal was rejected for X — consider Y").
-6. Executes the decision: squash-merge, close-with-comment, or comment-and-leave-open.
-7. Writes a completion checkpoint.
-
-**Expected runtime:** 3–8 min wall-clock (artifact fetch + review synthesis + operator reply + merge).
-**Expected API cost:** ~$0 beyond this Opus session (subscription). No managed-agent calls.
-
-## Pre-flight (MANDATORY — do not skip)
-
-```bash
-# 1. gh CLI auth — needed to list PR, read it, merge or close it.
-if ! gh auth status >/dev/null 2>&1; then
-  echo "ABORT: gh CLI not authenticated."
-  echo "Fix: run 'gh auth login' outside wbs, then retry this prompt."
-  exit 1
-fi
-
-# 2. Working tree clean — we'll switch branches and commit on main.
-if ! git diff --quiet || ! git diff --cached --quiet; then
-  echo "ABORT: working tree has uncommitted changes."
-  echo "Fix: commit or stash, then retry."
-  git status --short
-  exit 1
-fi
-
-# 3. This session does NOT need ANTHROPIC_API_KEY — it makes no managed-agent calls.
-#    If the key is exported it won't hurt, but it's also not required.
-
-mkdir -p tmp .claude/checkpoints
-```
-
-## Step 1 — Locate the council PR (30s)
-
-Pick the oldest open draft PR whose branch starts `council/`. Oldest = if multiple weeks accumulated unreviewed, we review them in order.
-
-```bash
-PR_JSON=$(gh pr list --state open --draft \
-  --json number,headRefName,url,createdAt --limit 50 \
-  | jq 'map(select(.headRefName | startswith("council/"))) | sort_by(.createdAt) | .[0] // empty')
-
-if [[ -z "$PR_JSON" ]]; then
-  echo "ABORT: no open draft PR on a council/ branch found."
-  echo "Either (a) a prior third-session already closed the loop, or"
-  echo "       (b) session 2 has not been run for the current week yet."
-  exit 1
-fi
-
-PR_NUM=$(echo "$PR_JSON" | jq -r '.number')
-BRANCH=$(echo "$PR_JSON" | jq -r '.headRefName')
-PR_URL=$(echo "$PR_JSON" | jq -r '.url')
-WEEK_DATE=${BRANCH#council/}
-
-echo "Reviewing PR #$PR_NUM — $PR_URL"
-echo "Branch: $BRANCH   Week: $WEEK_DATE"
-```
-
-## Step 2 — Fetch branch + verify artifacts (1 min)
-
-```bash
-git fetch origin "$BRANCH"
-git checkout "$BRANCH"
-git pull origin "$BRANCH"
-
-PROPOSAL="history/$WEEK_DATE/proposal.md"
-DECISION="history/$WEEK_DATE/decision.json"
-GENEALOGY_DIR="history/$WEEK_DATE/genealogy"
-OPERATOR_DECISION="history/$WEEK_DATE/operator-decision.json"
-
-echo "── Artifact presence ─────────────────────────"
-[[ -f "$PROPOSAL" ]] && echo "  ✓ $PROPOSAL ($(wc -l < "$PROPOSAL") lines)" \
-                    || echo "  ✗ $PROPOSAL MISSING"
-[[ -f "$DECISION" ]] && echo "  ✓ $DECISION" \
-                    || echo "  ✗ $DECISION MISSING"
-[[ -d "$GENEALOGY_DIR" ]] && echo "  + genealogy spawn: $(ls "$GENEALOGY_DIR" | tr '\n' ' ')" \
-                         || echo "    (no genealogy spawn this week)"
-
-# Guard: proposal missing = redesigner failed; cannot meaningfully review.
-if [[ ! -f "$PROPOSAL" ]]; then
-  echo "ABORT: $PROPOSAL missing on $BRANCH. Redesigner output absent — nothing to review."
-  echo "Fix: re-run Step 5 of second-wbs-session.md, then retry this prompt."
-  exit 1
-fi
-
-# Guard: loop already closed for this week.
-if [[ -f "$OPERATOR_DECISION" ]]; then
-  echo "NOTE: $OPERATOR_DECISION already exists:"
-  cat "$OPERATOR_DECISION"
-  echo "The PR is still open-draft but the decision was already recorded."
-  echo "If you want to re-decide, delete that file on $BRANCH and re-run."
-  exit 0
-fi
-```
-
-## Step 3 — Opus review + present options
-
-**You (Opus 4.7) now read the artifacts and produce the review below, then STOP and wait for the operator's reply.**
-
-Tool calls for this step:
-
-- `Read` `$PROPOSAL` — the redesigner's full proposal.
-- `Read` `$DECISION` — the redesigner's structured picks (primary + alt + rejected).
-- If `$GENEALOGY_DIR` exists: `Read` the first `*.md` findings file inside it to see what the spawned critic added.
-- Do NOT re-read individual critic findings — the proposal already synthesizes them. Keep context tight.
-
-Produce in chat, using this exact structure (operator is Richie — lead with scores per his communication preference):
-
-```markdown
-### Summary
-
-[2–3 sentences: what the proposal changes and why, in plain language.]
-
-### Strengths (top 1–2)
-
-- [Specific, not generic. "Hero headline swaps passive voice for outcome framing
-  — directly addresses conversion critic's #1 finding" not "good copy work".]
-
-### Risks (top 1–2)
-
-- [Specific failure mode. "H1 change breaks SEO tracking on 'homepage' event
-  unless the analytics tag is updated" not "could affect SEO".]
-
-### Genealogy
-
-[One line: no spawn | spawned <name> — <what gap it covered>]
-
-### Options
-
-1. **Merge** (X/100) — [one-line why]
-2. **Reject** (X/100) — [one-line why]
-3. **Defer** (X/100) — [one-line why]
-
----
-
-**Decide**: reply `merge`, `reject`, or `defer` — plus a 1-sentence rationale.
-```
-
-**HARD STOP.** Do not execute Steps 4–7 until the operator replies with a decision.
-
-## Step 4 — Record the decision
-
-When the operator replies, parse their choice (`merge` | `reject` | `defer`) and rationale. Set these as bash vars at the top of Step 5:
-
-```bash
-# Fill these in from the operator's reply.
-DECISION_CHOICE="merge"         # merge | reject | defer
-DECISION_RATIONALE="<one-sentence rationale from operator's reply>"
-
-# Validate.
-case "$DECISION_CHOICE" in
-  merge|reject|defer) ;;
-  *) echo "ERROR: DECISION_CHOICE must be merge|reject|defer, got '$DECISION_CHOICE'"; exit 1 ;;
-esac
-```
-
-## Step 5 — Execute the decision
-
-All three paths end on `main` with `history/$WEEK_DATE/operator-decision.json` committed. Merge adds a `merge_sha`; reject closes the PR; defer leaves it open with a comment.
-
-```bash
-case "$DECISION_CHOICE" in
-  merge)
-    # Squash-merge with rationale as merge-commit body.
-    gh pr merge "$PR_NUM" --squash --delete-branch \
-      --body "$DECISION_RATIONALE"
-
-    # Grab the squash commit SHA for the record.
-    MERGE_SHA=$(gh pr view "$PR_NUM" --json mergeCommit --jq '.mergeCommit.oid' 2>/dev/null)
-    [[ -z "$MERGE_SHA" || "$MERGE_SHA" == "null" ]] && MERGE_SHA="unknown"
-
-    git checkout main
-    git pull origin main
-
-    jq -n \
-      --arg d "$DECISION_CHOICE" \
-      --arg r "$DECISION_RATIONALE" \
-      --arg pr "$PR_URL" \
-      --arg sha "$MERGE_SHA" \
-      --arg ts "$(date -u +%Y-%m-%dT%H:%M:%SZ)" \
-      '{decision: $d, rationale: $r, pr_url: $pr, merge_sha: $sha, timestamp: $ts}' \
-      > "$OPERATOR_DECISION"
-
-    git add "$OPERATOR_DECISION"
-    git commit -m "docs(council): operator approved $BRANCH — $DECISION_RATIONALE"
-    git push origin main
-    RESULT="merged (sha=$MERGE_SHA, branch deleted)"
-    ;;
-
-  reject)
-    gh pr close "$PR_NUM" --comment "Rejected: $DECISION_RATIONALE"
-
-    git checkout main
-    git pull origin main
-    mkdir -p "history/$WEEK_DATE"
-
-    jq -n \
-      --arg d "$DECISION_CHOICE" \
-      --arg r "$DECISION_RATIONALE" \
-      --arg pr "$PR_URL" \
-      --arg ts "$(date -u +%Y-%m-%dT%H:%M:%SZ)" \
-      '{decision: $d, rationale: $r, pr_url: $pr, timestamp: $ts}' \
-      > "$OPERATOR_DECISION"
-
-    git add "$OPERATOR_DECISION"
-    git commit -m "docs(council): operator rejected $BRANCH — $DECISION_RATIONALE"
-    git push origin main
-    RESULT="rejected (PR closed, branch kept for history)"
-    ;;
-
-  defer)
-    gh pr comment "$PR_NUM" --body "Deferred: $DECISION_RATIONALE"
-
-    git checkout main
-    git pull origin main
-    mkdir -p "history/$WEEK_DATE"
-
-    jq -n \
-      --arg d "$DECISION_CHOICE" \
-      --arg r "$DECISION_RATIONALE" \
-      --arg pr "$PR_URL" \
-      --arg ts "$(date -u +%Y-%m-%dT%H:%M:%SZ)" \
-      '{decision: $d, rationale: $r, pr_url: $pr, timestamp: $ts}' \
-      > "$OPERATOR_DECISION"
-
-    git add "$OPERATOR_DECISION"
-    git commit -m "docs(council): operator deferred $BRANCH — $DECISION_RATIONALE"
-    git push origin main
-    RESULT="deferred (PR still open)"
-    ;;
-esac
-
-echo ""
-echo "── Decision executed ────────────────────────"
-echo "  Choice: $DECISION_CHOICE"
-echo "  Result: $RESULT"
-echo "  Record: $OPERATOR_DECISION"
-```
-
-## Step 6 — Checkpoint + exit
-
-```bash
-CKPT=".claude/checkpoints/$(date -u +%Y-%m-%dT%H%M%SZ)-session-3-complete.md"
-cat > "$CKPT" <<EOF
----
-ts: $(date -u +%Y-%m-%dT%H:%M:%SZ)
-trigger: session-3-complete
----
-
-## What happened
-
-Operator review of council week $WEEK_DATE PR. Decision: **$DECISION_CHOICE**. Result: $RESULT.
-
-## Artifacts
-
-- PR: $PR_URL
-- Decision record: $OPERATOR_DECISION
-- Rationale: $DECISION_RATIONALE
-
-## Next tick
-
-- Next council run: week ending $(python3 - <<'PY'
-from datetime import datetime, timedelta, timezone
-print((datetime.now(timezone.utc) + timedelta(days=7)).strftime('%Y-%m-%d'))
-PY
-).
-- Next week's monitor should pick up \`$OPERATOR_DECISION\` and factor the rationale
-  into its WoW anomaly framing (e.g., if rejected, the previous week's proposed
-  change did not ship — baseline is unchanged).
-EOF
-
-git add "$CKPT"
-git commit -m "docs(checkpoint): session 3 complete — $DECISION_CHOICE week $WEEK_DATE"
-git push origin main
-
-echo ""
-echo "══════════════════════════════════════════════════"
-echo "Session 3 complete."
-echo "  PR #$PR_NUM — $DECISION_CHOICE"
-echo "  Record: $OPERATOR_DECISION"
-echo "  Checkpoint: $CKPT"
-echo "══════════════════════════════════════════════════"
-exit 0
-```
-
-## If a step fails
-
-- **No open `council/` draft PR**: second-session hasn't run this week, or a prior third-session already closed the loop. Run `prompts/second-wbs-session.md` first.
-- **`proposal.md` missing on branch**: the redesigner didn't finish. Re-run Step 5 of the second session (`run_agent_session redesigner "$REDESIGNER_ID" "$MSG_REDESIGNER"` against the same branch), then retry this prompt.
-- **`operator-decision.json` already exists**: the loop is already closed for this week. Either (a) accept and exit, or (b) delete the file on `$BRANCH`, push, retry.
-- **`gh pr merge` rejected (CI red, protected branch, conflicts)**: the PR has a blocker. Fix the blocker on `$BRANCH` and re-push, then re-run this prompt from Step 1.
-- **Operator replies with something other than `merge|reject|defer`**: Step 4 validation aborts cleanly. Re-run the prompt and reply with a valid choice.
-
-## What this prompt DOES NOT do
-
-- **Does not re-run any critic.** Findings are frozen at PR-open time. If a critic was wrong, either reject-and-retry next week, or defer and re-run session 2 after fixing the agent.
-- **Does not touch `site/`.** This repo is still brief-only — no forked landing page to diff. When `site/` exists, the merge path will also land the diff; no change to this prompt required.
-- **Does not update `FEATURES.md` or run `bun run validate`.** This is a review prompt, not a feature prompt. The only code path it commits is the JSON record + checkpoint.
diff --git a/scripts/onboarding/scaffold-repo.ts b/scripts/onboarding/scaffold-repo.ts
new file mode 100644
index 0000000..4e5d839
--- /dev/null
+++ b/scripts/onboarding/scaffold-repo.ts
@@ -0,0 +1,327 @@
+#!/usr/bin/env bun
+/**
+ * Creates a fresh GitHub repo for the user's site and scaffolds a minimal Astro
+ * starter using brand identity from context/business.yaml.
+ *
+ * Usage: bun run onboarding:scaffold-repo [--name <repo-name>] [--public]
+ *
+ * Defaults:
+ *   --name = slug(business.name) + "-webster"
+ *   visibility = private (override with --public)
+ *
+ * Idempotent: if the repo already exists under the user's account, the script
+ * verifies it's empty (or only contains the scaffold) and skips creation.
+ *
+ * Writes:
+ *   - the new repo on github.com
+ *   - context/onboarding-repo.json with {repo, owner, default_branch, scaffolded_at}
+ */
+
+import { execFileSync, spawnSync } from "node:child_process";
+import { existsSync, mkdirSync, readFileSync, rmSync, writeFileSync } from "node:fs";
+import { join, resolve } from "node:path";
+
+const ROOT = resolve(import.meta.dir, "..", "..");
+const BUSINESS_YAML = join(ROOT, "context/business.yaml");
+const REPO_RECORD = join(ROOT, "context/onboarding-repo.json");
+
+interface Args {
+  name: string | null;
+  visibility: "public" | "private";
+}
+
+// Parses `--name <repo-name>` and `--public`; a `--name` without a usable value is an error.
+function parseArgs(): Args {
+  const args: Args = { name: null, visibility: "private" };
+  for (let i = 2; i < process.argv.length; i++) {
+    if (process.argv[i] === "--name") {
+      const next = process.argv[++i];
+      if (next === undefined || next.startsWith("--")) {
+        throw new Error("--name requires a value (e.g. --name my-site)");
+      }
+      args.name = next;
+    } else if (process.argv[i] === "--public") {
+      args.visibility = "public";
+    }
+  }
+  return args;
+}
+
+function readBusinessYaml(): {
+  name: string;
+  oneLine: string;
+  palettePrimary: string;
+  paletteAccent: string;
+  fontHeadline: string;
+  fontBody: string;
+} {
+  if (!existsSync(BUSINESS_YAML)) {
+    throw new Error(`context/business.yaml not found — run P1 of webster-onboarding first`);
+  }
+  const text = readFileSync(BUSINESS_YAML, "utf-8");
+  const get = (pattern: RegExp): string => {
+    const match = text.match(pattern);
+    const captured = match?.[1];
+    if (!captured) {
+      return "";
+    }
+    return captured.trim().replace(/^["']|["']$/g, "");
+  };
+  const name = get(/^\s{0,4}name:\s*(.+)$/m);
+  if (!name) {
+    throw new Error("business.name is empty in context/business.yaml");
+  }
+  const oneLine = get(/^\s{0,4}one_line:\s*(.+)$/m);
+  let palettePrimary = "#000000";
+  let paletteAccent = "#444444";
+  const paletteIdx = text.indexOf("palette:");
+  if (paletteIdx !== -1) {
+    const colors: string[] = [];
+    const afterLines = text.slice(paletteIdx).split("\n").slice(1);
+    for (const line of afterLines) {
+      const trimmed = line.trim();
+      if (trimmed === "") {
+        continue;
+      }
+      if (trimmed.startsWith("-")) {
+        const hex = trimmed.match(/#[0-9a-fA-F]{6}/);
+        if (hex) {
+          colors.push(hex[0]);
+        }
+        continue;
+      }
+      break;
+    }
+    if (colors[0]) {
+      palettePrimary = colors[0];
+    }
+    if (colors[1]) {
+      paletteAccent = colors[1];
+    }
+  }
+  const fontHeadline = get(/^\s{0,6}headline:\s*(.+)$/m) || "Inter";
+  const fontBody = get(/^\s{0,6}body:\s*(.+)$/m) || "Source Sans Pro";
+  return { name, oneLine, palettePrimary, paletteAccent, fontHeadline, fontBody };
+}
+
+// Slug used for repo, package and worker names: lowercase, each run of characters outside
+// [a-z0-9] becomes one "-", edge dashes are trimmed, and the result is at most 60 characters.
+function slugify(name: string): string {
+  const trimmed = name.toLowerCase().replace(/[^a-z0-9]+/g, "-").replace(/^-+|-+$/g, "");
+  // The 60-char cut can land right after an inner dash; strip it so the slug never ends in "-".
+  return trimmed.slice(0, 60).replace(/-+$/, "");
+}
+
+function getGhUser(): string {
+  try {
+    const out = execFileSync("gh", ["api", "/user", "--jq", ".login"], { encoding: "utf-8" });
+    return out.trim();
+  } catch (err) {
+    throw new Error(
+      `gh CLI not authenticated or not installed: ${err instanceof Error ? err.message : String(err)}`,
+    );
+  }
+}
+
+function repoExists(owner: string, name: string): boolean {
+  const result = spawnSync("gh", ["repo", "view", `${owner}/${name}`, "--json", "name"], {
+    encoding: "utf-8",
+  });
+  return result.status === 0;
+}
+
+function repoIsEmpty(owner: string, name: string): boolean {
+  const result = spawnSync("gh", ["api", `/repos/${owner}/${name}/commits`, "--jq", "length"], {
+    encoding: "utf-8",
+  });
+  if (result.status !== 0) {
+    return true;
+  }
+  const out = (result.stdout ?? "").trim();
+  return out === "0" || out === "[]" || out === "";
+}
+
+function createRepo(
+  owner: string,
+  name: string,
+  visibility: "public" | "private",
+  description: string,
+): void {
+  const args = [
+    "repo",
+    "create",
+    `${owner}/${name}`,
+    visibility === "public" ? "--public" : "--private",
+    "--description",
+    description,
+  ];
+  const result = spawnSync("gh", args, { encoding: "utf-8" });
+  if (result.status !== 0) {
+    throw new Error(`gh repo create failed: ${result.stderr ?? "no stderr"}`);
+  }
+}
+
+function scaffoldFiles(
+  workDir: string,
+  brand: {
+    name: string;
+    oneLine: string;
+    palettePrimary: string;
+    paletteAccent: string;
+    fontHeadline: string;
+    fontBody: string;
+  },
+): void {
+  mkdirSync(workDir, { recursive: true });
+  mkdirSync(join(workDir, "src/pages"), { recursive: true });
+  mkdirSync(join(workDir, "src/styles"), { recursive: true });
+  mkdirSync(join(workDir, "context"), { recursive: true });
+
+  const slug = slugify(brand.name);
+
+  writeFileSync(
+    join(workDir, "package.json"),
+    JSON.stringify(
+      {
+        name: slug,
+        type: "module",
+        version: "0.0.1",
+        private: true,
+        scripts: {
+          dev: "astro dev",
+          start: "astro dev",
+          build: "astro build",
+          preview: "astro preview",
+        },
+        dependencies: {
+          astro: "^4.0.0",
+          "@astrojs/cloudflare": "^9.0.0",
+        },
+      },
+      null,
+      2,
+    ) + "\n",
+  );
+
+  writeFileSync(
+    join(workDir, "astro.config.mjs"),
+    `import { defineConfig } from "astro/config";\nimport cloudflare from "@astrojs/cloudflare";\n\nexport default defineConfig({\n  output: "server",\n  adapter: cloudflare(),\n});\n`,
+  );
+
+  writeFileSync(
+    join(workDir, "wrangler.jsonc"),
+    JSON.stringify(
+      {
+        name: slug,
+        main: "./dist/_worker.js",
+        compatibility_date: "2026-04-01",
+        assets: { directory: "./dist" },
+      },
+      null,
+      2,
+    ) + "\n",
+  );
+
+  writeFileSync(
+    join(workDir, "src/styles/global.css"),
+    `:root {\n  --color-primary: ${brand.palettePrimary};\n  --color-accent: ${brand.paletteAccent};\n  --font-headline: "${brand.fontHeadline}", system-ui, sans-serif;\n  --font-body: "${brand.fontBody}", system-ui, sans-serif;\n}\n\nbody {\n  font-family: var(--font-body);\n  margin: 0;\n  color: #1a1a1a;\n}\n\nh1, h2, h3 { font-family: var(--font-headline); }\n\n.hero {\n  background: var(--color-primary);\n  color: white;\n  padding: 4rem 1.5rem;\n}\n\n.cta {\n  background: var(--color-accent);\n  color: #1a1a1a;\n  padding: 0.75rem 1.5rem;\n  border-radius: 4px;\n  font-weight: 600;\n  text-decoration: none;\n  display: inline-block;\n}\n`,
+  );
+
+  writeFileSync(
+    join(workDir, "src/pages/index.astro"),
+    `---\nimport "../styles/global.css";\nconst businessName = ${JSON.stringify(brand.name)};\nconst tagline = ${JSON.stringify(brand.oneLine)};\n---\n\n<html lang="en">\n  <head>\n    <meta charset="UTF-8" />\n    <meta name="viewport" content="width=device-width, initial-scale=1.0" />\n    <title>{businessName}</title>\n    <meta name="description" content={tagline} />\n  </head>\n  <body>\n    <section class="hero">\n      <h1>{businessName}</h1>\n      <p>{tagline}</p>\n      <a class="cta" href="#contact">Get in touch</a>\n    </section>\n    <section id="contact">\n      <h2>Contact</h2>\n      <p>Webster's first council run will populate this section with your real conversion path.</p>\n    </section>\n  </body>\n</html>\n`,
+  );
+
+  writeFileSync(
+    join(workDir, ".gitignore"),
+    `node_modules/\ndist/\n.astro/\n.env\n.env.local\n.env.*.local\ntmp/\n`,
+  );
+
+  writeFileSync(
+    join(workDir, "README.md"),
+    `# ${brand.name}\n\n${brand.oneLine}\n\nThis site is managed by [Webster](https://github.com/richsak/webster) — a council of Claude agents that proposes weekly improvements via pull request.\n\n## Develop\n\n\`\`\`bash\nbun install\nbun run dev\n\`\`\`\n\n## Deploy\n\nMerging a PR triggers Cloudflare Workers Builds to deploy automatically.\n`,
+  );
+}
+
+// Commits the scaffold in workDir as a fresh repo, pushes it to `main` on GitHub and returns
+// the commit SHA. Throws when a git command exits non-zero.
+function commitAndPush(workDir: string, owner: string, name: string): string {
+  const run = (cmd: [string, ...string[]], cwd: string): void => {
+    const [bin, ...rest] = cmd;
+    const result = spawnSync(bin, rest, { cwd, encoding: "utf-8" });
+    if (result.status !== 0) {
+      throw new Error(`${cmd.join(" ")} failed: ${result.stderr ?? "no stderr"}`);
+    }
+  };
+  // A retry after a failed push finds the old .git; drop it so commit/remote add cannot fail.
+  rmSync(join(workDir, ".git"), { recursive: true, force: true });
+  run(["git", "init", "-b", "main"], workDir);
+  run(["git", "add", "."], workDir);
+  run(["git", "commit", "-m", "feat: scaffold Astro starter via webster-onboarding"], workDir);
+  run(["git", "remote", "add", "origin", `https://github.com/${owner}/${name}.git`], workDir);
+  run(["git", "push", "-u", "origin", "main"], workDir);
+  return execFileSync("git", ["rev-parse", "HEAD"], { cwd: workDir, encoding: "utf-8" }).trim();
+}
+
+function recordScaffold(owner: string, name: string, sha: string): void {
+  mkdirSync(join(ROOT, "context"), { recursive: true });
+  writeFileSync(
+    REPO_RECORD,
+    JSON.stringify(
+      {
+        owner,
+        repo: name,
+        full_name: `${owner}/${name}`,
+        default_branch: "main",
+        scaffold_sha: sha,
+        scaffolded_at: new Date().toISOString(),
+      },
+      null,
+      2,
+    ) + "\n",
+  );
+}
+
+function main(): number {
+  const args = parseArgs();
+  const brand = readBusinessYaml();
+  const repoName = args.name ?? `${slugify(brand.name)}-webster`;
+  const owner = getGhUser();
+
+  console.log(`scaffolding ${owner}/${repoName} (${args.visibility})`);
+
+  if (repoExists(owner, repoName)) {
+    if (!repoIsEmpty(owner, repoName)) {
+      console.error(`✗ ${owner}/${repoName} already exists and is not empty`);
+      console.error(
+        `  hint: pick a different --name, or delete the existing repo first if it was a prior failed scaffold`,
+      );
+      return 1;
+    }
+    console.log(`reusing existing empty repo ${owner}/${repoName}`);
+  } else {
+    createRepo(owner, repoName, args.visibility, brand.oneLine || `Webster site for ${brand.name}`);
+    console.log(`created ${owner}/${repoName}`);
+  }
+
+  const workDir = join(ROOT, "tmp/onboarding-scaffold", repoName);
+  scaffoldFiles(workDir, brand);
+  console.log(`scaffolded files in ${workDir.replace(`${ROOT}/`, "")}`);
+
+  const sha = commitAndPush(workDir, owner, repoName);
+  console.log(`pushed initial commit ${sha} to ${owner}/${repoName}`);
+
+  recordScaffold(owner, repoName, sha);
+  console.log(`recorded scaffold metadata at ${REPO_RECORD.replace(`${ROOT}/`, "")}`);
+
+  return 0;
+}
+
+if (import.meta.main) {
+  try {
+    process.exit(main());
+  } catch (err) {
+    console.error(`scaffold-repo failed: ${err instanceof Error ? err.message : String(err)}`);
+    process.exit(1);
+  }
+}
diff --git a/scripts/onboarding/verify-all.ts b/scripts/onboarding/verify-all.ts
new file mode 100644
index 0000000..5d82814
--- /dev/null
+++ b/scripts/onboarding/verify-all.ts
@@ -0,0 +1,340 @@
+#!/usr/bin/env bun
+/**
+ * Rollup verifier for webster-onboarding phase exits.
+ *
+ * Usage: bun run onboarding:verify-all [--phase p3|p4]
+ *
+ * Verifies, in order:
+ *   1. .env.local exists and has all 3 required keys (live verify via verify-env.ts)
+ *   2. environments/webster-council-env.id exists and holds an env_... id
+ *   3. The configured GitHub repo is reachable via gh CLI
+ *   4. Each production agent (agents/*.json excluding -lp-sim-*, -site-sim-*) is registered by name
+ *   5. ≥6 memory stores are provisioned (read from context/memory-stores.json)
+ *
+ * Exit 0 only if every check passes. Each failure prints a one-liner with the
+ * failing check name + an actionable hint. See references/remediation.md.
+ */
+
+import { execFileSync, spawnSync } from "node:child_process";
+import { existsSync, readFileSync, readdirSync } from "node:fs";
+import { join, resolve } from "node:path";
+
+const ROOT = resolve(import.meta.dir, "..", "..");
+const ENV_FILE = join(ROOT, ".env.local");
+const AGENTS_DIR = join(ROOT, "agents");
+const MEMORY_STORES_FILE = join(ROOT, "context/memory-stores.json");
+const ENV_ID_FILE = join(ROOT, "environments/webster-council-env.id");
+
+const API_BASE = process.env.ANTHROPIC_API_BASE ?? "https://api.anthropic.com";
+const API = `${API_BASE.replace(/\/$/, "")}/v1`;
+const BETA = "managed-agents-2026-04-01";
+const VERSION = "2023-06-01";
+
+const SIM_PATTERN = /(?:^|\/)(?:webster-)?(?:lp|site)-sim-/;
+
+interface CheckResult {
+  name: string;
+  ok: boolean;
+  detail: string;
+  hint?: string;
+}
+
+/**
+ * Returns the first non-empty Anthropic API key found in: the ANTHROPIC_API_KEY env var, an
+ * ANTHROPIC_API_KEY= line of .env.local, the `security` keychain lookup. "" when none has one.
+ */
+function getApiKey(): string {
+  const fromEnv = process.env.ANTHROPIC_API_KEY;
+  if (fromEnv) {
+    return fromEnv;
+  }
+  if (existsSync(ENV_FILE)) {
+    for (const line of readFileSync(ENV_FILE, "utf-8").split("\n")) {
+      const trimmed = line.trim();
+      if (trimmed.startsWith("ANTHROPIC_API_KEY=")) {
+        const value = trimmed.slice("ANTHROPIC_API_KEY=".length).trim().replace(/^["']|["']$/g, "");
+        if (value) {
+          return value;
+        }
+      }
+    }
+  }
+  try {
+    return execFileSync(
+      "security",
+      ["find-generic-password", "-s", "anthropic-webster", "-a", process.env.USER ?? "", "-w"],
+      { encoding: "utf-8" },
+    ).trim();
+  } catch {
+    return ""; // the lookup threw (command missing or non-zero exit)
+  }
+}
+
+function checkEnvLocal(): CheckResult {
+  if (!existsSync(ENV_FILE)) {
+    return {
+      name: "env_local",
+      ok: false,
+      detail: ".env.local not found",
+      hint: "Create .env.local at repo root with the 3 required keys (see references/key-handling.md)",
+    };
+  }
+  const result = spawnSync("bun", ["run", "onboarding:verify-env"], {
+    cwd: ROOT,
+    encoding: "utf-8",
+  });
+  if (result.status === 0) {
+    return { name: "env_local", ok: true, detail: ".env.local verified live" };
+  }
+  return {
+    name: "env_local",
+    ok: false,
+    detail: (result.stdout ?? "").trim() || "verify-env returned non-zero",
+    hint: "Re-check the failing key in references/remediation.md (P3b section)",
+  };
+}
+
+function checkRepo(): CheckResult {
+  const repo = process.env.WEBSTER_TARGET_REPO ?? readBusinessRepo();
+  if (!repo) {
+    return {
+      name: "github_repo",
+      ok: false,
+      detail: "no target repo configured",
+      hint: "Set WEBSTER_TARGET_REPO env var or run scaffold-repo.ts to create one and record it",
+    };
+  }
+  const result = spawnSync("gh", ["repo", "view", repo, "--json", "name"], { encoding: "utf-8" });
+  if (result.status === 0) {
+    return { name: "github_repo", ok: true, detail: `${repo} reachable` };
+  }
+  return {
+    name: "github_repo",
+    ok: false,
+    detail: `${repo} not reachable (gh exit ${result.status})`,
+    hint: "Run `gh auth login` or run scaffold-repo to create the repo",
+  };
+}
+
+// Resolves "owner/repo": the scaffold-repo.ts record wins, else it is guessed from business.yaml.
+function readBusinessRepo(): string | null {
+  const record = join(ROOT, "context/onboarding-repo.json");
+  if (existsSync(record)) {
+    try {
+      const recorded: unknown = JSON.parse(readFileSync(record, "utf-8")).full_name;
+      if (typeof recorded === "string" && recorded.includes("/")) {
+        return recorded;
+      }
+    } catch {
+      // unreadable record: fall back to the guess below
+    }
+  }
+  const yamlPath = join(ROOT, "context/business.yaml");
+  const text = existsSync(yamlPath) ? readFileSync(yamlPath, "utf-8") : "";
+  const rawName = text.match(/^\s{0,4}name:\s*(.+)$/m)?.[1];
+  const ghUser = process.env.GITHUB_USER ?? process.env.USER ?? "";
+  if (!rawName || !ghUser) {
+    return null;
+  }
+  const unquoted = rawName.trim().replace(/^["']|["']$/g, "").toLowerCase();
+  return `${ghUser}/${unquoted.replace(/[^a-z0-9]+/g, "-").replace(/^-+|-+$/g, "")}-webster`;
+}
+
+function listProductionAgentSpecs(): string[] {
+  if (!existsSync(AGENTS_DIR)) {
+    return [];
+  }
+  return readdirSync(AGENTS_DIR)
+    .filter((f) => f.endsWith(".json"))
+    .filter((f) => !SIM_PATTERN.test(f))
+    .map((f) => join(AGENTS_DIR, f));
+}
+
+function readSpecName(file: string): string {
+  const json = JSON.parse(readFileSync(file, "utf-8")) as { name?: string };
+  if (!json.name) {
+    throw new Error(`spec missing 'name' field: ${file}`);
+  }
+  return json.name;
+}
+
+async function listRegisteredAgentNames(apiKey: string): Promise<Set<string>> {
+  const names = new Set<string>();
+  let url = `${API}/agents`;
+  while (url) {
+    const res = await fetch(url, {
+      headers: {
+        "x-api-key": apiKey,
+        "anthropic-version": VERSION,
+        "anthropic-beta": BETA,
+      },
+    });
+    if (!res.ok) {
+      throw new Error(`agent list HTTP ${res.status}`);
+    }
+    const data = (await res.json()) as {
+      data?: { id: string; name: string }[];
+      next_page?: string | null;
+      has_more?: boolean;
+      last_id?: string | null;
+    };
+    for (const agent of data.data ?? []) {
+      names.add(agent.name);
+    }
+    if (data.next_page) {
+      url = data.next_page.startsWith("http") ? data.next_page : `${API}${data.next_page}`;
+    } else if (data.has_more && data.last_id) {
+      const next = new URL(`${API}/agents`);
+      next.searchParams.set("after_id", data.last_id);
+      url = next.toString();
+    } else {
+      url = "";
+    }
+  }
+  return names;
+}
+
+async function checkAgents(apiKey: string): Promise<CheckResult> {
+  const specs = listProductionAgentSpecs();
+  if (specs.length === 0) {
+    return {
+      name: "agents",
+      ok: false,
+      detail: "no production agent specs found in agents/",
+      hint: "agents/*.json should contain at least the production critic + monitor + planner + redesigner specs",
+    };
+  }
+  const expectedNames = specs.map(readSpecName);
+  let registered: Set<string>;
+  try {
+    registered = await listRegisteredAgentNames(apiKey);
+  } catch (err) {
+    return {
+      name: "agents",
+      ok: false,
+      detail: `agent list failed: ${err instanceof Error ? err.message : String(err)}`,
+      hint: "ANTHROPIC_API_KEY may be invalid; run `bun run onboarding:verify-env` first",
+    };
+  }
+  const missing = expectedNames.filter((n) => !registered.has(n));
+  if (missing.length === 0) {
+    return {
+      name: "agents",
+      ok: true,
+      detail: `${expectedNames.length} production agents registered`,
+    };
+  }
+  return {
+    name: "agents",
+    ok: false,
+    detail: `missing ${missing.length} agent(s): ${missing.join(", ")}`,
+    hint: "Re-run agent registration (see prompts/first-wbs-session.md Step 2)",
+  };
+}
+
+function checkMemoryStores(): CheckResult {
+  if (!existsSync(MEMORY_STORES_FILE)) {
+    return {
+      name: "memory_stores",
+      ok: false,
+      detail: `${MEMORY_STORES_FILE.replace(`${ROOT}/`, "")} not found`,
+      hint: "Run `bun run scripts/provision-memory-stores.ts` to create stores and write the manifest",
+    };
+  }
+  let manifest: Record<string, Record<string, string>>;
+  try {
+    manifest = JSON.parse(readFileSync(MEMORY_STORES_FILE, "utf-8"));
+  } catch (err) {
+    return {
+      name: "memory_stores",
+      ok: false,
+      detail: `manifest is invalid JSON: ${err instanceof Error ? err.message : String(err)}`,
+      hint: "Delete the manifest and re-run provision-memory-stores",
+    };
+  }
+  const ids = Object.values(manifest).flatMap((roles) => Object.values(roles).filter(Boolean));
+  if (ids.length >= 6) {
+    return { name: "memory_stores", ok: true, detail: `${ids.length} memory stores provisioned` };
+  }
+  return {
+    name: "memory_stores",
+    ok: false,
+    detail: `only ${ids.length} memory stores in manifest (need ≥6)`,
+    hint: "Re-run `bun run scripts/provision-memory-stores.ts` to fill missing stores",
+  };
+}
+
+function checkEnvId(): CheckResult {
+  if (!existsSync(ENV_ID_FILE)) {
+    return {
+      name: "env_id",
+      ok: false,
+      detail: "environments/webster-council-env.id not found",
+      hint: "Run env registration (prompts/first-wbs-session.md Step 1)",
+    };
+  }
+  const id = readFileSync(ENV_ID_FILE, "utf-8").trim();
+  if (!/^env_/.test(id)) {
+    return {
+      name: "env_id",
+      ok: false,
+      detail: `env id malformed: '${id}'`,
+      hint: "Re-run env registration to write a valid env_... id",
+    };
+  }
+  return { name: "env_id", ok: true, detail: id };
+}
+
+// Reads the value after the first `--phase` flag (case-insensitive); anything but "p3" is "p4".
+function parsePhase(): "p3" | "p4" {
+  const flagAt = process.argv.indexOf("--phase");
+  if (flagAt === -1) {
+    return "p4";
+  }
+  const requested = process.argv[flagAt + 1]?.toLowerCase();
+  return requested === "p3" ? "p3" : "p4";
+}
+
+async function main(): Promise<number> {
+  const phase = parsePhase();
+  console.log(`onboarding:verify-all phase=${phase}`);
+
+  const apiKey = getApiKey();
+  if (!apiKey) {
+    console.error("fail: no Anthropic API key (env, .env.local, and keychain all empty)");
+    return 1;
+  }
+
+  const checks: CheckResult[] = [];
+  checks.push(checkEnvLocal());
+  checks.push(checkEnvId());
+  checks.push(checkRepo());
+  checks.push(await checkAgents(apiKey));
+  checks.push(checkMemoryStores());
+
+  let allOk = true;
+  for (const c of checks) {
+    if (c.ok) {
+      console.log(`✓ ${c.name}: ${c.detail}`);
+    } else {
+      allOk = false;
+      console.error(`✗ ${c.name}: ${c.detail}`);
+      if (c.hint) {
+        console.error(`  hint: ${c.hint}`);
+      }
+    }
+  }
+
+  console.log("");
+  console.log(allOk ? `phase ${phase} green` : `phase ${phase} BLOCKED`);
+  return allOk ? 0 : 1;
+}
+
+if (import.meta.main) {
+  main()
+    .then((code) => process.exit(code))
+    .catch((err) => {
+      console.error(`verify-all crashed: ${err instanceof Error ? err.message : String(err)}`);
+      process.exit(2);
+    });
+}
diff --git a/scripts/onboarding/verify-env.ts b/scripts/onboarding/verify-env.ts
new file mode 100644
index 0000000..2b9f946
--- /dev/null
+++ b/scripts/onboarding/verify-env.ts
@@ -0,0 +1,175 @@
+#!/usr/bin/env bun
+/**
+ * Reads .env.local, verifies each of the three required keys against its
+ * provider, and prints `<provider>: ok | fail (<reason>)` per key — never
+ * echoing key values.
+ *
+ * Exit 0 only if all three pass. Used as the P3b gate of webster-onboarding.
+ */
+
+import { existsSync, readFileSync } from "node:fs";
+import { resolve } from "node:path";
+
+// Absolute path of .env.local, resolved against the current working directory.
+const ENV_FILE = resolve(process.cwd(), ".env.local");
+
+// Names of the keys that must each have a line in .env.local.
+const REQUIRED = ["ANTHROPIC_API_KEY", "GITHUB_TOKEN", "CLOUDFLARE_API_TOKEN"] as const;
+// Union of the literal key names listed in REQUIRED.
+type RequiredKey = (typeof REQUIRED)[number];
+
+/** Outcome of checking one provider credential. */
+interface VerifyResult {
+  // Provider label used as the prefix of the printed report line.
+  provider: string;
+  // Whether the check passed.
+  ok: boolean;
+  // Short explanation of the outcome; the report prints it only on failure.
+  reason: string;
+}
+
+/**
+ * Parse a dotenv-style file into a key → value map.
+ *
+ * Blank lines, lines starting with `#`, lines without `=`, and lines with an
+ * empty key (e.g. `=value`) are ignored. Keys and values are trimmed, and one
+ * pair of matching surrounding quotes (single or double) is removed from the
+ * value. When a key appears more than once the last occurrence wins.
+ *
+ * @param path - file to read; a missing file yields an empty map
+ * @returns map of key name to value
+ */
+function parseEnvFile(path: string): Map<string, string> {
+  const out = new Map<string, string>();
+  if (!existsSync(path)) {
+    return out;
+  }
+  const text = readFileSync(path, "utf-8");
+  for (const rawLine of text.split("\n")) {
+    // trim() also drops the trailing "\r" of CRLF files.
+    const line = rawLine.trim();
+    if (!line || line.startsWith("#")) {
+      continue;
+    }
+    const eq = line.indexOf("=");
+    // -1: no assignment at all; 0: "=value" has no key to store.
+    if (eq <= 0) {
+      continue;
+    }
+    const key = line.slice(0, eq).trim();
+    let value = line.slice(eq + 1).trim();
+    // Require at least two characters so a value that is a single quote
+    // character is kept as-is instead of being "unquoted" to an empty string.
+    const quote = value[0];
+    if (value.length >= 2 && (quote === '"' || quote === "'") && value.endsWith(quote)) {
+      value = value.slice(1, -1);
+    }
+    out.set(key, value);
+  }
+  return out;
+}
+
+/**
+ * Check the Anthropic key by requesting the models list.
+ *
+ * @param key - value read from .env.local; an empty string fails without a
+ *              network call
+ * @returns a result for provider "anthropic"; never rejects — network errors
+ *          and timeouts are reported as a failed result
+ */
+async function verifyAnthropic(key: string): Promise<VerifyResult> {
+  if (!key) {
+    return { provider: "anthropic", ok: false, reason: "key empty in .env.local" };
+  }
+  try {
+    const res = await fetch("https://api.anthropic.com/v1/models", {
+      headers: {
+        "x-api-key": key,
+        "anthropic-version": "2023-06-01",
+      },
+      // Bound the request so an unresponsive network cannot hang the gate.
+      signal: AbortSignal.timeout(15000),
+    });
+    if (res.ok) {
+      return { provider: "anthropic", ok: true, reason: "200 OK" };
+    }
+    return { provider: "anthropic", ok: false, reason: `HTTP ${res.status}` };
+  } catch (err) {
+    // A thrown value is not guaranteed to be an Error instance.
+    const message = err instanceof Error ? err.message : String(err);
+    return { provider: "anthropic", ok: false, reason: `fetch error: ${message}` };
+  }
+}
+
+/**
+ * Check the GitHub token by requesting the authenticated user.
+ *
+ * @param token - value read from .env.local; an empty string fails without a
+ *                network call
+ * @returns a result for provider "github"; never rejects — network errors and
+ *          timeouts are reported as a failed result
+ */
+async function verifyGitHub(token: string): Promise<VerifyResult> {
+  if (!token) {
+    return { provider: "github", ok: false, reason: "token empty in .env.local" };
+  }
+  try {
+    const res = await fetch("https://api.github.com/user", {
+      headers: {
+        Authorization: `Bearer ${token}`,
+        Accept: "application/vnd.github+json",
+        "X-GitHub-Api-Version": "2022-11-28",
+      },
+      // Bound the request so an unresponsive network cannot hang the gate.
+      signal: AbortSignal.timeout(15000),
+    });
+    if (res.ok) {
+      return { provider: "github", ok: true, reason: "200 OK" };
+    }
+    return { provider: "github", ok: false, reason: `HTTP ${res.status}` };
+  } catch (err) {
+    // A thrown value is not guaranteed to be an Error instance.
+    const message = err instanceof Error ? err.message : String(err);
+    return { provider: "github", ok: false, reason: `fetch error: ${message}` };
+  }
+}
+
+/**
+ * Check the Cloudflare token against the token-verify endpoint.
+ *
+ * Passes only when the HTTP response is successful, the body's `success` is
+ * truthy, and `result.status` is "active".
+ *
+ * @param token - value read from .env.local; an empty string fails without a
+ *                network call
+ * @returns a result for provider "cloudflare"; never rejects — network
+ *          errors, timeouts, and unparsable bodies are reported as a failed
+ *          result
+ */
+async function verifyCloudflare(token: string): Promise<VerifyResult> {
+  if (!token) {
+    return { provider: "cloudflare", ok: false, reason: "token empty in .env.local" };
+  }
+  try {
+    const res = await fetch("https://api.cloudflare.com/client/v4/user/tokens/verify", {
+      headers: { Authorization: `Bearer ${token}` },
+      // Bound the request so an unresponsive network cannot hang the gate.
+      signal: AbortSignal.timeout(15000),
+    });
+    if (!res.ok) {
+      return { provider: "cloudflare", ok: false, reason: `HTTP ${res.status}` };
+    }
+    const body = (await res.json()) as { success?: boolean; result?: { status?: string } };
+    if (body.success && body.result?.status === "active") {
+      return { provider: "cloudflare", ok: true, reason: "active" };
+    }
+    return {
+      provider: "cloudflare",
+      ok: false,
+      reason: `inactive (status=${body.result?.status ?? "unknown"})`,
+    };
+  } catch (err) {
+    // Also reached when res.json() fails; the thrown value is not guaranteed
+    // to be an Error instance.
+    const message = err instanceof Error ? err.message : String(err);
+    return { provider: "cloudflare", ok: false, reason: `fetch error: ${message}` };
+  }
+}
+
+/**
+ * Report a failure when `key` has no line at all in the parsed env file.
+ *
+ * @param env - parsed contents of .env.local
+ * @param key - required key to look for
+ * @returns null when the key is present (even with an empty value); otherwise
+ *          a failed result labelled with the provider name derived from `key`
+ */
+function checkLineMissing(env: Map<string, string>, key: RequiredKey): VerifyResult | null {
+  if (env.has(key)) {
+    return null;
+  }
+  return {
+    // Strip the whole credential suffix (_API_KEY, _API_TOKEN, _KEY, _TOKEN)
+    // so CLOUDFLARE_API_TOKEN is labelled "cloudflare", not "cloudflare_api".
+    provider: key.toLowerCase().replace(/(?:_api)?_(?:key|token)$/, ""),
+    ok: false,
+    reason: `missing ${key}= line in .env.local`,
+  };
+}
+
+/**
+ * Verify the three required keys in .env.local and print one
+ * `<provider>: ok | fail (<reason>)` line per key.
+ *
+ * Stops before any network call when the file is absent or a required key
+ * has no line in it.
+ *
+ * @returns 0 when all three providers verified; 1 otherwise
+ */
+async function main(): Promise<number> {
+  if (!existsSync(ENV_FILE)) {
+    console.error("fail: .env.local not found at repo root");
+    console.error("hint: see references/key-handling.md for the exact file format");
+    return 1;
+  }
+
+  const env = parseEnvFile(ENV_FILE);
+
+  // Collect every missing key first so the user sees all of them at once.
+  const absent = REQUIRED.map((key) => checkLineMissing(env, key)).filter(
+    (result): result is VerifyResult => result !== null,
+  );
+  if (absent.length > 0) {
+    for (const miss of absent) {
+      console.log(`${miss.provider}: fail (${miss.reason})`);
+    }
+    return 1;
+  }
+
+  // The three provider checks run concurrently; output keeps this order.
+  const outcomes = await Promise.all([
+    verifyAnthropic(env.get("ANTHROPIC_API_KEY") ?? ""),
+    verifyGitHub(env.get("GITHUB_TOKEN") ?? ""),
+    verifyCloudflare(env.get("CLOUDFLARE_API_TOKEN") ?? ""),
+  ]);
+
+  for (const outcome of outcomes) {
+    const status = outcome.ok ? "ok" : `fail (${outcome.reason})`;
+    console.log(`${outcome.provider}: ${status}`);
+  }
+  return outcomes.every((outcome) => outcome.ok) ? 0 : 1;
+}
+
+// Entry point: run only when this file is the program being executed.
+// Exit code is main()'s return value, or 2 if main() rejects.
+if (import.meta.main) {
+  const exitWith = (code: number): never => process.exit(code);
+  const reportCrash = (err: unknown): never => {
+    const message = err instanceof Error ? err.message : String(err);
+    console.error(`verify-env crashed: ${message}`);
+    return process.exit(2);
+  };
+  main().then(exitWith).catch(reportCrash);
+}
diff --git a/skills/webster-onboarding/SKILL.md b/skills/webster-onboarding/SKILL.md
new file mode 100644
index 0000000..47197d0
--- /dev/null
+++ b/skills/webster-onboarding/SKILL.md
@@ -0,0 +1,264 @@
+---
+name: webster-onboarding
+description: |
+  Use when a small-business owner installs Webster on their own landing page. Drives the six-phase first-time setup: brand context capture, key checklist, repo scaffold, agent + memory-store provisioning, verification, first council run.
+  Triggers: "install webster", "set up webster", "onboard webster", "webster onboarding", "new webster site", "webster setup".
+---
+
+# Webster Onboarding
+
+Guide a small-business owner (likely non-technical) through Webster's first-time setup. Plain language. Bracket-define unavoidable technical terms inline — e.g., "API key [the password your site uses to talk to Claude]".
+
+The skill is a thin shell over `scripts/onboarding/*` and the runtime registration patterns in `prompts/first-wbs-session.md`. It does NOT translate site code (deferred to a future `webster-design-import` skill) and does NOT touch DNS (deferred to a demo subdomain pattern).
+
+## Hard rules (security + integrity — never violate)
+
+- **Never ask the user to paste API keys into chat.** Keys are written by the user into `.env.local` on their own machine. Verification scripts read the file and hit each provider's verify endpoint; they never echo key values to stdout, stderr, or any committed file.
+- **`ANTHROPIC_API_KEY` for the dispatcher (the `claude` process running this skill) MUST come from the macOS keychain (`security find-generic-password -s anthropic-webster -a $USER`)**, not from the shell environment. If `$ANTHROPIC_API_KEY` is exported, billing switches from Max subscription to API credits and drains fast.
+- **No mock keys, no "test mode", no fallbacks.** If a key is missing or fails verification, halt at the failing phase, write the status file, surface the remediation hint from `references/remediation.md`. User fixes, re-runs the skill, resumes from the same phase.
+- **No fabricated brand details.** What the user doesn't say or supply, mark TBD or skip — never invent a certification, year, or stat.
+- **No silent broadening.** If a verify check passes by coincidence (e.g., `gh repo view` succeeds because gh is logged into a different account), the script must distinguish that and fail loud.
+
+## Phase pre-load checks
+
+Status file location: `context/onboarding-status.json`.
+
+```!
+test -f context/onboarding-status.json && cat context/onboarding-status.json || echo '{"phase":"P0","completed":[],"next_action":"start","started_at":null,"brand_corpus_paths":[]}'
+```
+
+```!
+ls agents/*.json 2>/dev/null | grep -v -E "lp-sim|site-sim" | wc -l | tr -d ' '
+```
+
+```!
+test -f environments/webster-council-env.id && printf "env_id_file: present\n" || printf "env_id_file: missing\n"
+```
+
+```!
+test -f .env.local && printf "env_local: present\n" || printf "env_local: missing\n"
+```
+
+```!
+security find-generic-password -s anthropic-webster -a "$USER" -w >/dev/null 2>&1 && printf "anthropic_keychain: present\n" || printf "anthropic_keychain: MISSING (run: security add-generic-password -U -s anthropic-webster -a \"\$USER\" -w \"sk-ant-...\")\n"
+```
+
+```!
+[[ -z "$ANTHROPIC_API_KEY" ]] && printf "anthropic_shell_env: clean (good)\n" || printf "anthropic_shell_env: EXPORTED (bad — unset before continuing or Max sub billing breaks)\n"
+```
+
+Read the status JSON above. If `phase` is anything other than `P0`, print one line: `Resuming P{N} — {next_action}` and jump straight to that phase's section. Do not re-run earlier phases.
+
+## P0 — Overview (target: 8s of video)
+
+State to the user, in plain language:
+
+> Webster is going to set up your site so it improves itself every week. We'll do six steps:
+>
+> 1. Capture your brand (logo, voice, past work)
+> 2. Confirm three keys you have ready
+> 3. Scaffold your site repo
+> 4. Wire up the council (9–10 agents + 6 memory stores)
+> 5. Verify everything's connected
+> 6. Run the first council and surface a pull request
+>
+> Total time: about 5 minutes. If anything fails, we stop, tell you what to fix, and pick up where we left off.
+
+Wait for the user to type "ready" (or any acknowledgment). Then write the status file:
+
+```bash
+mkdir -p context
+cat > context/onboarding-status.json <<EOF
+{"phase":"P1","completed":["P0"],"next_action":"capture brand context","started_at":"$(date -u +%Y-%m-%dT%H:%M:%SZ)","brand_corpus_paths":[]}
+EOF
+```
+
+**Gate (soft)**: user typed "ready". Advance to P1.
+
+## P1 — Brand context capture (target: 25s of video)
+
+Read `references/qa-bank.md` for the full Q&A flow. Summary: there are three input sources, and the dynamic Q&A fills only the gaps left by sources 1+2.
+
+**Source 1 (optional) — URL scrape**: ask "Do you have an existing site URL we can pull from?" If yes, fetch it (use WebFetch built-in tool), extract text + meta tags + visible palette/font signals + any image URLs. If the URL is parked / SPA / 404, surface the failure verbatim and offer: move on, retry, or abandon URL source.
+
+**Source 2 (optional) — file uploads**: ask "Drag any of these into chat: logo, business card, past-job photos, service list, customer reviews, voice notes." Accept `pdf, md, txt, jpg, png, csv`. Copy each into `context/brand-corpus/` (mkdir first). Reference paths from `business.yaml` `corpus:` array — never base64-inline.
+
+**Source 3 (always) — dynamic Q&A**: ask only the questions whose answers are missing from sources 1+2. The 6 essentials in priority order:
+
+1. Business name?
+2. One-line description (what you sell, to whom)?
+3. Brand voice register? (warm-direct / clinical / casual / premium / playful)
+4. Target customer / region?
+5. Do-not-use copy + visual list?
+6. Trust signals (years in business, certifications, insurance)?
+
+Ask one at a time. Wait for each answer. If the user answered something already (via URL scrape or file), skip it.
+
+For LP installs specifically, also capture the single-offer contract per `references/business-yaml-schema.md` `landing_page` section — what the page sells, primary audience, primary conversion, what NOT to promote. Without this, council critics drift from the LP into homepage / program-directory territory.
+
+Write to `context/business.yaml` per the schema in `references/business-yaml-schema.md`. Use the Empire example in that file as a structural template.
+
+Update status:
+
+```bash
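+# Read the old value first: the `>` redirect empties the file before the heredoc's $(...) would run.
+started_at="$(jq -r '.started_at // empty' context/onboarding-status.json 2>/dev/null)"
+[ -n "$started_at" ] || started_at="$(date -u +%Y-%m-%dT%H:%M:%SZ)"
+corpus_paths="$(find context/brand-corpus -type f 2>/dev/null | jq -R . | jq -sc .)"
+cat > context/onboarding-status.json <<EOF
+{"phase":"P2","completed":["P0","P1"],"next_action":"present checklist","started_at":"${started_at}","brand_corpus_paths":${corpus_paths:-[]}}
+EOF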
+```
+
+**Gate (hard)**: `context/business.yaml` exists AND has at least one source signal (corpus file present, or non-empty business name). Verify:
+
+```bash
+test -f context/business.yaml || { echo "GATE FAIL P1: context/business.yaml missing"; exit 1; }
+test -n "$(jq -r '.business.name // empty' context/business.yaml 2>/dev/null || yq -r '.business.name // empty' context/business.yaml 2>/dev/null)" || { echo "GATE FAIL P1: business.name empty"; exit 1; }
+```
+
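+(`jq` only parses JSON, so on a YAML file the first command fails and the check effectively relies on `yq`. If `yq` is not installed, `grep -E "^[[:space:]]*name:" context/business.yaml` is a sufficient fallback.)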
+
+## P2 — Prep checklist (target: 8s of video)
+
+Read `references/key-handling.md` and print the disclaimer block to the user verbatim. Do not paraphrase it — the wording is locked.
+
+Show the checklist:
+
+```text
+[ ] 1. Anthropic API key — from console.anthropic.com (must have Memory Stores + Managed Agents quota enabled)
+[ ] 2. GitHub fine-grained PAT — Contents:read+write, Metadata:read on the target repo
+[ ] 3. Cloudflare API token — "Workers Edit" scope, from dash.cloudflare.com/profile/api-tokens
+```
+
+Wait for the user to type "all ready" (or equivalent). Then advance.
+
+Update status:
+
+```bash
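+# Read the old values first: the `>` redirect empties the file before the heredoc's $(...) would run.
+started_at="$(jq -r .started_at context/onboarding-status.json)"
+corpus_paths="$(jq -c .brand_corpus_paths context/onboarding-status.json)"
+cat > context/onboarding-status.json <<EOF
+{"phase":"P3","completed":["P0","P1","P2"],"next_action":"execute setup","started_at":"${started_at}","brand_corpus_paths":${corpus_paths}}
+EOF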
+```
+
+**Gate (hard)**: user confirmed all three keys are at hand. No verification yet (that's P3 — they need to be in `.env.local` first).
+
+## P3 — Execute (target: 15s of video)
+
+Three sub-steps. Do them in order. Stop on first failure.
+
+### P3a — User writes `.env.local` locally
+
+Print the disclaimer again, then exact instructions:
+
+> Open `.env.local` in your editor (it's already in `.gitignore`). Paste these three lines, replacing each `<paste>` with your actual key. Save. Tell me when done — do NOT paste the keys back here.
+>
+> ```dotenv
+> ANTHROPIC_API_KEY=<paste>
+> GITHUB_TOKEN=<paste>
+> CLOUDFLARE_API_TOKEN=<paste>
+> ```
+
+Wait for "done" (or equivalent). Confirm the file exists without reading its contents:
+
+```bash
+test -f .env.local || { echo "GATE FAIL P3a: .env.local not found"; exit 1; }
+grep -q "^ANTHROPIC_API_KEY=" .env.local || { echo "GATE FAIL P3a: ANTHROPIC_API_KEY line missing in .env.local"; exit 1; }
+grep -q "^GITHUB_TOKEN=" .env.local || { echo "GATE FAIL P3a: GITHUB_TOKEN line missing in .env.local"; exit 1; }
+grep -q "^CLOUDFLARE_API_TOKEN=" .env.local || { echo "GATE FAIL P3a: CLOUDFLARE_API_TOKEN line missing in .env.local"; exit 1; }
+echo "P3a OK: .env.local has all three keys (values not read)"
+```
+
+### P3b — Verify keys against live providers
+
+```bash
+bun run onboarding:verify-env
+```
+
+The script reads `.env.local`, hits the verify endpoints (`/v1/models` for Anthropic, `/user` for GitHub, `/user/tokens/verify` for Cloudflare), and prints `ok` or `fail` per key without echoing values. On any fail: surface the failing line + the remediation hint from `references/remediation.md`, halt, preserve status file.
+
+### P3c — Scaffold repo + provision council
+
+```bash
+bun run onboarding:scaffold-repo            # creates GitHub repo, scaffolds Astro starter from context/business.yaml
+bun run provision-memory-stores             # existing script — provisions 6 stores per substrate
+# Register environment + production agents using the patterns in prompts/first-wbs-session.md
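+# Source the keychain Anthropic key into a SUBSHELL only — never export to outer shell
+(
+  ANTHROPIC_API_KEY="$(security find-generic-password -s anthropic-webster -a "$USER" -w)"
+  export ANTHROPIC_API_KEY   # child processes need it exported; the export ends with this subshell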
+  bash prompts/first-wbs-session.md   # the bootstrap script section runs env + agent registration
+)
+```
+
+If `prompts/first-wbs-session.md` is structured as readable markdown rather than a runnable script, extract the bash blocks and execute them in the subshell — the same pattern, just inline.
+
+Update status:
+
+```bash
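+# Read the old values first: the `>` redirect empties the file before the heredoc's $(...) would run.
+started_at="$(jq -r .started_at context/onboarding-status.json)"
+corpus_paths="$(jq -c .brand_corpus_paths context/onboarding-status.json)"
+cat > context/onboarding-status.json <<EOF
+{"phase":"P4","completed":["P0","P1","P2","P3"],"next_action":"verify rollup","started_at":"${started_at}","brand_corpus_paths":${corpus_paths}}
+EOF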
+```
+
+**Gate (hard rollup)**: `bun run onboarding:verify-all --phase p3` exits 0. That script verifies `.env.local` is live + GitHub repo reachable + agent count matches `agents/*.json` non-sim count + memory stores ≥ 6.
+
+## P4 — Verify (target: 12s of video)
+
+```bash
+bun run onboarding:verify-all --phase p4
+```
+
+Same rollup as P3 but re-run after the user has had a chance to fix anything. On green: print "All systems wired. Ready for first council." On any fail: surface the failing check + remediation hint, halt, preserve status.
+
+Update status:
+
+```bash
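+# Read the old values first: the `>` redirect empties the file before the heredoc's $(...) would run.
+started_at="$(jq -r .started_at context/onboarding-status.json)"
+corpus_paths="$(jq -c .brand_corpus_paths context/onboarding-status.json)"
+cat > context/onboarding-status.json <<EOF
+{"phase":"P5","completed":["P0","P1","P2","P3","P4"],"next_action":"run first council","started_at":"${started_at}","brand_corpus_paths":${corpus_paths}}
+EOF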
+```
+
+**Gate (hard)**: rollup green.
+
+## P5 — First council (target: 22s of video)
+
+Trigger the first council session against the user's freshly scaffolded repo. Use the same session-creation pattern as `prompts/first-wbs-session.md` Step 3 (substituting the user's own repo URL for `richsak/webster` and reading the SEO critic ID from `context/critics/seo/id.txt`).
+
+Stream the session until idle (10 min timeout, then poll `/v1/sessions/{id}` for `status: idle`). On success: extract the PR URL from the session output and surface to the user:
+
+> Your first council ran. Here's the pull request: <URL>
+>
+> Webster will run again next Sunday. You'll get a PR email when improvements are proposed. Merge if you like the changes.
+
+Final status:
+
+```bash
+# Read the old values first: the `>` redirect empties the file before the heredoc's $(...) would run.
+started_at="$(jq -r .started_at context/onboarding-status.json)"
+corpus_paths="$(jq -c .brand_corpus_paths context/onboarding-status.json)"
+cat > context/onboarding-status.json <<EOF
+{"phase":"DONE","completed":["P0","P1","P2","P3","P4","P5"],"next_action":"none","started_at":"${started_at}","brand_corpus_paths":${corpus_paths},"first_council_pr":"<PR_URL>","first_session_id":"<SESSION_ID>"}
+EOF
+```
+
+**Gate (hard)**: `session_id` returned non-empty AND PR URL visible in stream output.
+
+## End state (after onboarding is complete)
+
+- `context/business.yaml` with brand context (and `context/brand-corpus/` populated)
+- `.env.local` with 3 verified keys (file exists; values never read by the skill)
+- Astro site scaffolded in user's GitHub repo
+- `environments/webster-council-env.id` written
+- 10 production agents registered with IDs at `context/{role}/id.txt`
+- 6 memory stores provisioned, IDs at `context/memory-stores.json`
+- One open PR in the user's repo with week-1 council redesign
+- `context/onboarding-status.json` with `phase: DONE`
+
+## Reference files
+
+- `references/qa-bank.md` — full Q&A flow, dynamic-fill rules, URL-scrape failure modes
+- `references/business-yaml-schema.md` — `business.yaml` schema with Empire example as template
+- `references/key-handling.md` — locked disclaimer text, `.env.local` writing rules, verification flow
+- `references/remediation.md` — per-gate failure → remediation hint mapping
+- `references/empire-fixture.md` — Empire Asphalt Paving brand identity for hackathon case-study video
+
+## Companion scripts (in `scripts/onboarding/`)
+
+- `verify-env.ts` — reads `.env.local`, hits Anthropic + GitHub + Cloudflare verify endpoints, redacts values
+- `verify-all.ts` — rollup with `--phase {p3,p4}` flag (env + repo + agents + memory stores)
+- `scaffold-repo.ts` — creates GitHub repo + Astro starter using brand identity from `context/business.yaml`
+
+Bun script names: `bun run onboarding:verify-env`, `bun run onboarding:verify-all`, `bun run onboarding:scaffold-repo`.
diff --git a/skills/webster-onboarding/references/business-yaml-schema.md b/skills/webster-onboarding/references/business-yaml-schema.md
new file mode 100644
index 0000000..d47c328
--- /dev/null
+++ b/skills/webster-onboarding/references/business-yaml-schema.md
@@ -0,0 +1,159 @@
+# `context/business.yaml` schema
+
+The brand-context output of P1. Read by every council critic and the redesigner. Authoritative source for brand identity.
+
+## Schema
+
+```yaml
+business:
+  name: string # required
+  tagline: string | null
+  one_line: string # required — "what you sell, to whom"
+  industry: string | null
+  target_customer: string # required
+  region: string | null
+
+voice:
+  register: string # required — warm-direct | clinical | casual | premium | playful | <free-form>
+  reading_level: string # default "9th grade"
+  pronouns: string # default "we"
+  energy: string | null # e.g. "calm-confident", "high-energy", "understated"
+
+do_not_use:
+  copy: string[] # banned phrases / vibes
+  visual: string[] # banned visual tropes / stock-photo styles
+
+brand:
+  palette: string[] # hex codes, primary first; ≥1 entry
+  type:
+    headline: string # font family for headings
+    body: string # font family for body
+  logo_path: string | null # path under context/brand-corpus/
+
+trust:
+  certifications: string[]
+  insured: bool
+  years_in_business: int | null
+  awards: string[] | null
+
+corpus: # paths to files in context/brand-corpus/, populated by P1
+  - path: context/brand-corpus/logo.png
+    kind: logo
+  - path: context/brand-corpus/voice-notes.md
+    kind: voice-notes
+  # ... etc
+
+landing_page: # OPTIONAL — only present if installing on a single LP, not a multi-page site
+  primary_offer:
+    name: string
+    category: string
+    one_sentence: string
+    not: string[] # what this offer is NOT (defensive framing)
+  primary_audience: string # more specific than business.target_customer
+  primary_conversion: string # the action a visitor should take
+  allowed_supporting_mentions: string[] # other offers that may appear in passing
+  disallowed_page_drift: string[] # locked from webster-decision-log.md
+```
+
+### Notes on the `landing_page` block
+
+If the user is installing on a single landing page (not a multi-page site), the `landing_page` section is **mandatory**. Without it, council critics drift the LP into homepage / program-directory territory. This is locked in `webster-decision-log.md` 1249–1251.
+
+If the user is installing on a multi-page site, omit `landing_page` and rely on `business.*` + per-page metadata in the future site-context system.
+
+## Empire Asphalt Paving — example
+
+```yaml
+business:
+  name: Empire Asphalt Paving
+  tagline: Premium handcraft paving since 2008
+  one_line: Family-owned asphalt paving and repair for residential driveways, parking lots, and patches across the Greater Toronto Area
+  industry: asphalt paving
+  target_customer: Homeowners and small commercial property owners who care about craft over price
+  region: Greater Toronto Area
+
+voice:
+  register: warm-direct
+  reading_level: 8th-9th grade
+  pronouns: we
+  energy: calm-confident
+
+do_not_use:
+  copy:
+    - "industry-leading"
+    - "innovative solutions"
+    - "synergy"
+    - emoji
+    - hyperbole adjectives ("amazing", "incredible")
+  visual:
+    - stock-photo CGI trucks
+    - cartoon icons
+    - saturated primaries beyond brand colors
+    - generic "happy customer" stock photos
+
+brand:
+  palette:
+    - "#1B47A1" # royal blue (logo primary)
+    - "#F9D71C" # bright yellow (logo accent)
+    - "#292F2E" # near-black (text)
+  type:
+    headline: Inter
+    body: Source Sans Pro
+  logo_path: context/brand-corpus/logo.png
+
+trust:
+  certifications: []
+  insured: true
+  years_in_business: 18
+  awards: []
+
+corpus:
+  - path: context/brand-corpus/logo.png
+    kind: logo
+  - path: context/brand-corpus/business-card.jpg
+    kind: business-card
+  - path: context/brand-corpus/past-jobs/job-1.jpg
+    kind: past-job
+  - path: context/brand-corpus/past-jobs/job-2.jpg
+    kind: past-job
+  - path: context/brand-corpus/past-jobs/job-3.jpg
+    kind: past-job
+  - path: context/brand-corpus/service-list.md
+    kind: service-list
+  - path: context/brand-corpus/reviews.md
+    kind: reviews
+  - path: context/brand-corpus/voice-notes.md
+    kind: voice-notes
+
+landing_page:
+  primary_offer:
+    name: Driveway paving + sealcoat
+    category: residential paving
+    one_sentence: We pave or repair your driveway and seal it for the long haul — done by family, not subcontractors.
+    not:
+      - parking lot resurfacing (separate page)
+      - asphalt supply or wholesale
+      - snow removal
+  primary_audience: GTA homeowners with a driveway needing repair, repaving, or sealcoat
+  primary_conversion: Book a free on-site estimate
+  allowed_supporting_mentions:
+    - patch repair (mention as a related service in passing)
+    - line-striping (mention only if visitor asks)
+  disallowed_page_drift:
+    - parking lot job listings
+    - commercial pricing tables
+    - generic "all paving services" landing
+```
+
+## Validation rules
+
+When P1 finishes, the skill should validate:
+
+- `business.name`, `business.one_line`, `business.target_customer` are non-empty
+- `voice.register` is non-empty (free-form is fine)
+- `brand.palette` has ≥1 hex code (matches `/^#[0-9a-fA-F]{6}$/`)
+- If `landing_page` is present, `primary_offer.name`, `primary_audience`, `primary_conversion` are all non-empty
+- All `corpus[].path` files exist under `context/brand-corpus/`
+- `do_not_use.copy` has ≥1 entry (forces user to commit to at least one banned phrase — "no banned phrases" is a smell)
+
+If any validation fails, surface the failure + offer to re-ask the relevant question. Do not advance to P2 with an incomplete `business.yaml`.
diff --git a/skills/webster-onboarding/references/empire-fixture.md b/skills/webster-onboarding/references/empire-fixture.md
new file mode 100644
index 0000000..cf1ed86
--- /dev/null
+++ b/skills/webster-onboarding/references/empire-fixture.md
@@ -0,0 +1,59 @@
+# Empire Asphalt Paving — hackathon case-study fixture
+
+Reference data for the 90-second case-study video showing Webster installation on Richie's dad's paving business. Used by the recording, not by the skill at runtime.
+
+The full storyboard, recording surface, and pre-recording checklist live in `context/ONBOARDING-CASE-STUDY.md`. This file is the brand-data shape used to dry-run the skill before recording.
+
+## Brand identity
+
+| field             | value                                                                              |
+| ----------------- | ---------------------------------------------------------------------------------- |
+| primary color     | royal blue `#1B47A1` (from logo)                                                   |
+| accent color      | bright yellow `#F9D71C` (from logo)                                                |
+| voice register    | warm-direct, premium-handcraft, family-business                                    |
+| reading level     | 8th–9th grade                                                                      |
+| pronouns          | "we"                                                                               |
+| do-not-use copy   | "industry-leading", "innovative solutions", emoji, "synergy", hyperbole adjectives |
+| do-not-use visual | stock-photo CGI trucks, cartoon icons, saturated primaries beyond brand colors     |
+| trust signals     | 18 years, family-owned, fully insured, real past-job photos                        |
+
+## Brand corpus directory (must exist before recording)
+
+```text
+context/brand-corpus/
+├── logo.png                 ← royal blue circle + yellow crown + cursive "e"
+├── business-card.jpg        ← real if available; mock if not (consistent with logo palette)
+├── past-jobs/
+│   ├── job-1.jpg            ← driveway paving
+│   ├── job-2.jpg            ← parking lot resurfacing
+│   └── job-3.jpg            ← patch repair / sealcoat
+├── service-list.md          ← typed by Richie from dad's known services
+├── reviews.md               ← 2-3 paraphrased real reviews; star count, name, year
+└── voice-notes.md           ← Richie-paraphrased dad quotes capturing voice tone
+```
+
+## `business.yaml` (full Empire example)
+
+See `references/business-yaml-schema.md` "Empire Asphalt Paving — example" section for the canonical YAML.
+
+## Pre-recording checklist (subset relevant to the skill)
+
+- [ ] `webster-onboarding` skill exists at this path with the P0–P5 phase model
+- [ ] `bun run onboarding:verify-all` passes against a fresh test environment
+- [ ] Empire's ugly v0 HTML committed to a fresh GitHub repo (e.g., `richsak/empire-paving-demo`) — handled by T13, not by the skill
+- [ ] `context/brand-corpus/` populated with all corpus files for Empire
+- [ ] Anthropic API key has Memory Stores + Managed Agents quota
+- [ ] Cloudflare API token + GitHub PAT in `.env.local`
+- [ ] One dry-run install completed successfully end-to-end before live take
+
+## Why this fixture matters
+
+The Empire case study features the second of three real humans in the demo chain (Nicolette in Beat 1, Dad here, Richie as builder/operator). It supplements the main 3-minute demo with a 90s "what does this look like for a real non-technical owner" view. The skill must produce the same end state Richie shows in the video — drift between the recording and what the skill actually does kills credibility.
+
+When dry-running the skill before recording, use this Empire fixture as the input. After the dry-run, confirm:
+
+1. `context/business.yaml` matches the schema example
+2. `context/brand-corpus/` has all 8 expected files
+3. `bun run onboarding:verify-all --phase p4` exits 0
+4. The first council session opens a PR against `richsak/empire-paving-demo` with a week-1 redesign
+5. `context/onboarding-status.json` reads `phase: DONE`
diff --git a/skills/webster-onboarding/references/key-handling.md b/skills/webster-onboarding/references/key-handling.md
new file mode 100644
index 0000000..4fc6b17
--- /dev/null
+++ b/skills/webster-onboarding/references/key-handling.md
@@ -0,0 +1,108 @@
+# Key handling — security-critical
+
+This is the part of the skill where the user's secrets enter the system. Mistakes here are unrecoverable (key leaks). Read every rule before P2.
+
+## The locked disclaimer
+
+Print verbatim at the start of P2 and again at the start of P3a. Do not paraphrase.
+
+> **For your safety, do NOT paste API keys into this chat.**
+>
+> Open `.env.local` in a text editor on your own computer and paste them there. The skill will read the file directly and verify each key against the provider — no key value is ever sent through chat, written to logs, or committed to git.
+>
+> If you accidentally paste a key in chat: stop, rotate the key on the provider dashboard, and start over. Do not assume "deleting the message" is enough — chat history may have been logged elsewhere.
+
+## What goes in `.env.local`
+
+```dotenv
+ANTHROPIC_API_KEY=<your key here>
+GITHUB_TOKEN=<your fine-grained PAT here>
+CLOUDFLARE_API_TOKEN=<your Workers Edit token here>
+```
+
+Three lines, no quotes, no spaces around `=`. The user pastes their actual key values in place of `<...>`.
+
+## Why each key
+
+| key                    | scope                                                                            | what it does                                                       |
+| ---------------------- | -------------------------------------------------------------------------------- | ------------------------------------------------------------------ |
+| `ANTHROPIC_API_KEY`    | full account                                                                     | runs the council agents (each session bills against this account)  |
+| `GITHUB_TOKEN`         | fine-grained PAT, Contents:read+write + Metadata:read on the user's webster repo | lets agents clone, push branches, open PRs                         |
+| `CLOUDFLARE_API_TOKEN` | "Workers Edit" scope                                                             | deploys the user's site (used by `wrangler deploy` after PR merge) |
+
+## File location
+
+`.env.local` lives at the repo root. It is `.gitignore`-d (the repo's `.gitignore` already excludes `.env*`). Confirm before P3a:
+
+```bash
+grep -q "^\.env" .gitignore || echo "WARNING: .gitignore does not exclude .env files — add this line: .env.local"
+```
+
+## Verification flow
+
+After the user reports they've saved `.env.local`:
+
+1. **Confirm file presence and key-line presence WITHOUT reading values:**
+
+   ```bash
+   test -f .env.local
+   grep -q "^ANTHROPIC_API_KEY=" .env.local
+   grep -q "^GITHUB_TOKEN=" .env.local
+   grep -q "^CLOUDFLARE_API_TOKEN=" .env.local
+   ```
+
+   `grep -q` exits 0/1 without printing values. Safe.
+
+2. **Run the live verifier:**
+
+   ```bash
+   bun run onboarding:verify-env
+   ```
+
+   The script (`scripts/onboarding/verify-env.ts`):
+   - Reads `.env.local` into process env
+   - Hits each provider's verify endpoint
+   - Prints one line per key: `anthropic: ok` / `anthropic: fail (HTTP 401)` etc.
+   - **Never prints key values, key prefixes, or any substring of the keys**
+   - Exits 0 only if all three pass
+
+3. **On any fail:** look up the failing key in `references/remediation.md`, print the matching remediation hint, halt P3, preserve `context/onboarding-status.json`. User fixes (rotates key / fixes scope / re-pastes), runs `bun run onboarding:verify-env` again. Once green, re-enter the skill — it resumes at P3.
+
+## Dispatcher key handling (separate rule)
+
+The `claude` process running this skill itself needs `ANTHROPIC_API_KEY`. **It must come from the macOS keychain, not from the shell environment**, otherwise the dispatcher bills against API credits instead of the Max subscription.
+
+Check at skill start:
+
+```bash
+if [[ -n "$ANTHROPIC_API_KEY" ]]; then
+  echo "ERROR: \$ANTHROPIC_API_KEY is exported in your shell."
+  echo "This makes the claude dispatcher bill against API credits, not Max subscription."
+  echo "Fix: exit this session, run 'unset ANTHROPIC_API_KEY', start a new session, retry."
+  exit 1
+fi
+
+if ! security find-generic-password -s anthropic-webster -a "$USER" -w >/dev/null 2>&1; then
+  echo "ERROR: anthropic-webster keychain entry missing."
+  echo "One-time setup: security add-generic-password -U -s anthropic-webster -a \"\$USER\" -w \"sk-ant-...\""
+  exit 1
+fi
+```
+
+This is separate from the user-facing `ANTHROPIC_API_KEY` in `.env.local`. They can be the same key value, but the dispatcher fetches from keychain, while runtime council agents read from `.env.local` (or, in the cloud Managed Agents environment, from the vault credential).
+
+## Anti-patterns (never do these)
+
+- ❌ "Just paste your key here once and I'll save it for you" — even temporarily, even with redaction promises
+- ❌ Reading `.env.local` contents into a chat-visible variable (`$(cat .env.local)`) — even for diagnosis
+- ❌ Echoing the first/last 4 chars of a key for "verification" — leaks key prefix, which is enough to attack
+- ❌ Logging API requests or responses that contain the key — redact the `Authorization` / `x-api-key` header values (and any key echoed in an error message) before printing any HTTP error details
+- ❌ Falling back to a shared "demo key" if user's key fails — there is no demo key, halt instead
+
+## Anti-pattern detection
+
+If the user types something that looks like a key in chat (e.g., starts with `sk-ant-`, `ghp_`, `github_pat_`, or is a 32+ char alphanumeric string near the words "key" / "token"), interrupt them:
+
+> Stop — that looks like an API key. Don't paste it in chat. Save it to `.env.local` instead. If you already pasted it: rotate the key now on the provider dashboard, then come back.
+
+This is a courtesy guard, not a security guarantee — assume any key that touches chat is leaked.
diff --git a/skills/webster-onboarding/references/qa-bank.md b/skills/webster-onboarding/references/qa-bank.md
new file mode 100644
index 0000000..082273c
--- /dev/null
+++ b/skills/webster-onboarding/references/qa-bank.md
@@ -0,0 +1,91 @@
+# P1 — Q&A bank
+
+The brand-context capture phase has three input sources. Q&A only fills gaps left by sources 1 and 2.
+
+## Source 1 — URL scrape (optional)
+
+Ask: "Do you have an existing site URL we can pull from?"
+
+If yes, fetch it via the WebFetch built-in tool. Extract:
+
+- **Text**: headings, hero copy, body text, footer
+- **Meta tags**: title, description, og:title, og:description, og:image
+- **Visible palette signals**: dominant colors from background/heading inline styles or linked CSS
+- **Font signals**: `font-family` declarations from inline styles or linked CSS
+- **Image URLs**: hero image, logo, any product/job photos
+
+Map extracted signals to `business.yaml` fields:
+
+| extracted signal                     | yaml field                                                                    |
+| ------------------------------------ | ----------------------------------------------------------------------------- |
+| `<title>` or `<h1>`                  | `business.name` (if not already set)                                          |
+| meta description / hero subheading   | `business.one_line`                                                           |
+| dominant background color            | `brand.palette[0]`                                                            |
+| accent color (button bg, link color) | `brand.palette[1]`                                                            |
+| `font-family` heading                | `brand.type.headline`                                                         |
+| `font-family` body                   | `brand.type.body`                                                             |
+| logo image URL                       | download to `context/brand-corpus/logo.<ext>`, reference in `brand.logo_path` |
+
+### URL scrape failure handling
+
+If the URL is parked, returns 404, is a JS-only SPA (empty `<body>`), or times out:
+
+- Surface the failure verbatim to the user (don't paraphrase the error)
+- Offer three choices: **(a) move on** — skip URL source, continue to file uploads; **(b) retry** — try the URL again (rate-limit signals may have cleared); **(c) abandon URL source** — never ask again this session
+
+Do not silently skip. Do not auto-retry without asking.
+
+## Source 2 — File uploads (optional)
+
+Ask: "Drag any of these into the chat — logo, business card, past-job photos, service list, customer reviews, voice notes. I accept pdf, md, txt, jpg, png, csv."
+
+For each file:
+
+1. `mkdir -p context/brand-corpus/`
+2. Copy the file into `context/brand-corpus/` preserving its name (sanitize spaces → hyphens, lowercase)
+3. If it's a `past-job` photo or there are 3+ similar images, group them under `context/brand-corpus/past-jobs/job-{1..N}.jpg`
+4. Reference paths in `business.yaml` under `corpus:` array — never base64-inline file contents
+5. If it's a text-bearing file (`md`, `txt`, `csv`, OCR-readable `pdf`/`jpg`/`png`), extract the text and use it to auto-fill `business.yaml` fields per the same mapping as Source 1
+
+Recommended brand corpus layout (from `context/ONBOARDING-CASE-STUDY.md`):
+
+```text
+context/brand-corpus/
+├── logo.png
+├── business-card.jpg
+├── past-jobs/
+│   ├── job-1.jpg
+│   ├── job-2.jpg
+│   └── job-3.jpg
+├── service-list.md
+├── reviews.md
+└── voice-notes.md
+```
+
+## Source 3 — Dynamic Q&A (always)
+
+Ask only the questions whose answers are still missing after sources 1 and 2.
+
+Order of essentials (1 → 6, ask one at a time, wait for each answer):
+
+1. **Business name?**
+2. **One-line description** — what you sell, to whom?
+3. **Brand voice register?** Pick one or describe in your own words: warm-direct, clinical, casual, premium, playful.
+4. **Target customer + region?** Who are you trying to reach, and where do they live?
+5. **Do-not-use list** — any words, phrases, visual styles, or stock-photo tropes you want Webster to avoid? (Examples: "industry-leading", "synergy", emoji, CGI trucks, cartoon icons.)
+6. **Trust signals** — years in business, certifications, insurance status, real past-job photos available?
+
+If the user is installing on a **landing page** (not a multi-page site), also capture the single-offer contract (per `business-yaml-schema.md` `landing_page` section). Continue the same one-at-a-time pattern with these four follow-ups:
+
+- **Primary offer** — what specifically does this page sell?
+- **Primary audience** — who is this page for? (More specific than overall target customer.)
+- **Primary conversion** — what action do you want a visitor to take?
+- **Do not promote on this page** — what other things you sell should this page NOT mention? (Without this, council critics drift the LP into homepage / program-directory territory — locked in `webster-decision-log.md`.)
+
+## Q&A discipline
+
+- **One question at a time.** Wait for each answer. Don't batch.
+- **Bracket-define jargon inline.** "Voice register [the personality your writing comes across as]"
+- **Never invent answers.** If the user says "I don't know" or skips, write `TBD` to the YAML field and continue. Do not fabricate.
+- **Show the user what you wrote.** After each answer, echo back: "Got it — saving as `voice.register: warm-direct`."
+- **Confirm at end of P1.** Before advancing to P2, print the full `business.yaml` and ask "Anything wrong before we continue?"
diff --git a/skills/webster-onboarding/references/remediation.md b/skills/webster-onboarding/references/remediation.md
new file mode 100644
index 0000000..a7ae016
--- /dev/null
+++ b/skills/webster-onboarding/references/remediation.md
@@ -0,0 +1,128 @@
+# Per-gate failure → remediation hints
+
+When a phase exit gate fails, look up the specific check in this file and print the matching hint to the user. Halt the skill, preserve `context/onboarding-status.json`. User fixes, re-enters the skill, resumes from the same phase.
+
+## P1 — Brand context
+
+| failure                         | hint                                                                                                                              |
+| ------------------------------- | --------------------------------------------------------------------------------------------------------------------------------- |
+| `context/business.yaml` missing | "P1 didn't write `business.yaml`. Did you skip the Q&A? Re-enter the skill — it'll resume P1 and re-ask only the missing fields." |
+| `business.name` empty           | "Business name is required. Re-enter the skill, answer Q1."                                                                       |
+| URL scrape failed               | (handled inline in P1, not a gate failure)                                                                                        |
+
+## P2 — Prep checklist
+
+| failure                                     | hint                                                                                                   |
+| ------------------------------------------- | ------------------------------------------------------------------------------------------------------ |
+| User typed something other than "all ready" | "Take your time. The skill paused. When you have all three keys in hand, type 'all ready' to advance." |
+
+## P3a — `.env.local` write
+
+| failure                              | hint                                                                                                                                                                                                        |
+| ------------------------------------ | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| `.env.local` not found               | "I don't see `.env.local` in the repo root. Create it (in your editor, not in chat), paste the three key=value lines per `references/key-handling.md`, save, then say 'done'."                              |
+| `ANTHROPIC_API_KEY=` line missing    | "`.env.local` is missing the `ANTHROPIC_API_KEY=` line. Add it (no quotes, no spaces around `=`), save, retry."                                                                                             |
+| `GITHUB_TOKEN=` line missing         | "`.env.local` is missing the `GITHUB_TOKEN=` line. Add it, save, retry."                                                                                                                                    |
+| `CLOUDFLARE_API_TOKEN=` line missing | "`.env.local` is missing the `CLOUDFLARE_API_TOKEN=` line. Add it, save, retry."                                                                                                                            |
+| `.gitignore` doesn't exclude `.env*` | "Critical: `.gitignore` doesn't exclude `.env.local`. Add a line `.env*` to `.gitignore` and commit it BEFORE running `bun run onboarding:verify-env`. Otherwise your keys could be committed by accident." |
+
+## P3b — Live key verification
+
+### `anthropic: fail (HTTP 401)`
+
+> Your `ANTHROPIC_API_KEY` was rejected by Anthropic. Most common causes:
+>
+> - Key was copied with whitespace — re-copy from console.anthropic.com without trailing spaces
+> - Key was rotated/revoked — generate a new one
+> - Key is for a different account than the one you intended
+>
+> Fix `.env.local`, run `bun run onboarding:verify-env` again.
+
+### `anthropic: fail (HTTP 403)` or "Insufficient quota"
+
+> Your Anthropic account doesn't have access to Memory Stores or Managed Agents. These are required for Webster.
+>
+> - Check your account at console.anthropic.com → Settings → Plan
+> - Memory Stores need to be enabled (it's a public beta feature; some accounts need to opt in)
+> - Managed Agents API needs the `managed-agents-2026-04-01` beta header — confirm your account has access
+>
+> If your account doesn't have access yet, request it via Anthropic support. Do NOT proceed without quota — the skill will fail at P3c.
+
+### `github: fail (HTTP 401)`
+
+> Your `GITHUB_TOKEN` was rejected by GitHub. Most common causes:
+>
+> - Token expired (fine-grained PATs have expiration dates)
+> - Token was revoked
+> - Token is for a personal account but you're trying to scaffold a repo under an org
+>
+> Generate a new fine-grained PAT at github.com/settings/personal-access-tokens/new. Required scopes:
+>
+> - **Contents**: Read and write
+> - **Metadata**: Read
+> - **Repository access**: select the specific repo (or "all repositories" if you don't have one yet — `scaffold-repo` will create one).
+>
+> Paste the new token in `.env.local`, retry.
+
+### `github: fail (HTTP 403)`
+
+> Your `GITHUB_TOKEN` is valid but lacks required permissions. Webster needs Contents:write to push branches. Re-issue the token with the right scopes (see above), retry.
+
+### `cloudflare: fail (HTTP 401)` or `(invalid)`
+
+> Your `CLOUDFLARE_API_TOKEN` was rejected. Common causes:
+>
+> - Token was copied incorrectly
+> - Token is for a different Cloudflare account than the one hosting your site
+> - Token doesn't have the "Workers Edit" scope (the only scope Webster requires)
+>
+> Generate a new token at dash.cloudflare.com/profile/api-tokens. Use the "Edit Cloudflare Workers" template, scope it to your account.
+
+## P3c — Scaffold + provision
+
+### `scaffold-repo: GitHub repo already exists`
+
+> A repo by this name already exists under your account. Two options:
+>
+> - **Use the existing repo**: edit `context/business.yaml` `business.name` to match the existing repo name exactly. (Alternatively, if the existing repo is empty and you don't need it, delete it on github.com and re-run scaffold.)
+> - **Pick a different name**: re-run scaffold with a different repo name via `bun run onboarding:scaffold-repo --name <new-name>`.
+
+### `provision-memory-stores: HTTP 429 (rate limit)`
+
+> Anthropic rate-limited the memory store creation calls. Wait 60 seconds, then re-run `bun run provision-memory-stores`. The script is idempotent — already-created stores will be reused.
+
+### `register-agents: env_id_file missing`
+
+> The environment hasn't been registered yet. Re-run the bootstrap section of `prompts/first-wbs-session.md` (Step 1), which writes `environments/webster-council-env.id`. Then retry agent registration.
+
+## P4 — Verify rollup
+
+### `agent_count_mismatch: expected N, found M`
+
+> Some agents didn't register. Check `tmp/logs/` for the registration session output, find the failing agent name, and re-run registration for just that one. The script is idempotent for successful agents.
+
+### `memory_stores_low: expected ≥6, found N`
+
+> Memory store provisioning didn't complete. Re-run `bun run provision-memory-stores` — already-created stores will be reused, missing ones will be added.
+
+### `repo_unreachable: HTTP 404 from gh repo view`
+
+> The `gh` CLI couldn't reach your repo. Either:
+>
+> - The repo wasn't created (re-run scaffold-repo)
+> - The repo is private and `gh` isn't authenticated for that account (run `gh auth login`)
+> - The repo name in `context/business.yaml` doesn't match the actual repo name on github.com
+
+## P5 — First council
+
+### Session creation HTTP 400 / 422
+
+> The session creation request was malformed. Most common cause: the agent ID in `context/critics/seo/id.txt` is stale (e.g., a previous registration was rolled back). Re-run agent registration to refresh IDs.
+
+### Session timed out before idle
+
+> The first council session ran longer than 10 minutes. Check `tmp/logs/seo-hello-stream.log` for the last activity. If the session is still progressing, re-run with a longer timeout. If it's stuck, surface `[STUCK]` to the operator and capture the session ID for debugging.
+
+### No PR URL in session output
+
+> The redesigner ran but didn't open a PR. Check that `GITHUB_TOKEN` has Contents:write on the target repo (re-verify with `bun run onboarding:verify-env`). If the token is fine, the redesigner may have hit a content moderation block — check the session output for the actual error.