diff --git a/.claude/intelligence-cache.json b/.claude/intelligence-cache.json
index 78244a3e9..8358ce57f 100644
--- a/.claude/intelligence-cache.json
+++ b/.claude/intelligence-cache.json
@@ -263,7 +263,7 @@
           }
         }
       ],
-      "timestamp": 1775302080,
+      "timestamp": 1775307153,
       "ttl": 1800
     },
     "fdbb7bc340414cf938cecd4b790fa9e2": {
diff --git a/.claude/loop-logs/iteration-1.log b/.claude/loop-logs/iteration-1.log
index 625f2153b..5fb2f6213 100644
--- a/.claude/loop-logs/iteration-1.log
+++ b/.claude/loop-logs/iteration-1.log
@@ -1,11 +1 @@
-Perfect! The goal has been fully achieved. The shipwright CLI now has a `hello` command that outputs "hello world". The implementation:
-
-1. ✅ Added the `hello` command to the help text
-2. ✅ Implemented the command case statement in the main router
-3. ✅ Tested the command works correctly
-4. ✅ All tests pass
-5. ✅ Committed with a descriptive message
-
-The command is now available as `shipwright hello` (and with aliases `sw hello` and `cct hello`).
-
-LOOP_COMPLETE
+{"type":"result","subtype":"success","is_error":false,"duration_ms":90646,"duration_api_ms":90727,"num_turns":13,"result":"Done. Here's what was implemented:\n\n- **`sw-hello.sh`**: Reads version from `package.json` at runtime (using `jq` with grep fallback). Both the default (no-args) output and `--version` flag now display `Shipwright v3.2.4`.\n- **`sw-hello-test.sh`**: Updated `test_hello_output` and `test_hello_version` to match the new `Shipwright vX.Y.Z` format. Added `test_hello_version_from_package_json` to verify the version matches `package.json` exactly.\n\nAll 7 hello tests pass. The 3 pre-existing failures in the full suite are unrelated (swarm/tmux integration, PM learn subcommand, predictive anomaly detection).\n\nLOOP_COMPLETE","stop_reason":"end_turn","session_id":"85c3bb83-ce13-4a58-8360-86070237830f","total_cost_usd":0.5034482999999998,"usage":{"input_tokens":14,"cache_creation_input_tokens":62482,"cache_read_input_tokens":628216,"output_tokens":5124,"server_tool_use":{"web_search_requests":0,"web_fetch_requests":0},"service_tier":"standard","cache_creation":{"ephemeral_1h_input_tokens":62482,"ephemeral_5m_input_tokens":0},"inference_geo":"","iterations":[],"speed":"standard"},"modelUsage":{"claude-sonnet-4-6":{"inputTokens":14,"outputTokens":5124,"cacheReadInputTokens":628216,"cacheCreationInputTokens":62482,"webSearchRequests":0,"costUSD":0.49967429999999996,"contextWindow":200000,"maxOutputTokens":32000},"claude-haiku-4-5-20251001":{"inputTokens":3284,"outputTokens":98,"cacheReadInputTokens":0,"cacheCreationInputTokens":0,"webSearchRequests":0,"costUSD":0.003774,"contextWindow":200000,"maxOutputTokens":32000}},"permission_denials":[],"terminal_reason":"completed","fast_mode_state":"off","uuid":"cf1bc8ac-8d20-4abb-a3bb-2726d25b75c4"}
diff --git a/.claude/loop-logs/iteration-2.log b/.claude/loop-logs/iteration-2.log
index e7872772d..e1c7a59a8 100644
--- a/.claude/loop-logs/iteration-2.log
+++ b/.claude/loop-logs/iteration-2.log
@@ -1 +1 @@
-Invalid API key · Fix external API key
+{"type":"result","subtype":"success","is_error":false,"duration_ms":116879,"duration_api_ms":135475,"num_turns":22,"result":"The goal is complete:\n\n1. **sw-hello command** (`scripts/sw-hello.sh`) reads version from `package.json` and displays `Shipwright vX.Y.Z` — done in iteration 1\n2. **Test suite** (`scripts/sw-hello-test.sh`) with 7 tests all passing — done in iteration 1  \n3. **Cost test fix** — the `sw-cost-test.sh` context efficiency tests were failing because hardcoded Feb 27 timestamps fell outside the 30-day window. Fixed by using dynamic `$(date +%s)` timestamps.\n\nAll failures in the full test suite (PM learn, predictive anomaly, swarm/tmux) are pre-existing and unrelated to this feature.\n\nLOOP_COMPLETE","stop_reason":"end_turn","session_id":"34b07770-fff9-46f4-b45a-56472d0fb114","total_cost_usd":0.6772343999999999,"usage":{"input_tokens":21,"cache_creation_input_tokens":69222,"cache_read_input_tokens":1108633,"output_tokens":5214,"server_tool_use":{"web_search_requests":0,"web_fetch_requests":0},"service_tier":"standard","cache_creation":{"ephemeral_1h_input_tokens":69222,"ephemeral_5m_input_tokens":0},"inference_geo":"","iterations":[],"speed":"standard"},"modelUsage":{"claude-sonnet-4-6":{"inputTokens":21,"outputTokens":5214,"cacheReadInputTokens":1108633,"cacheCreationInputTokens":69222,"webSearchRequests":0,"costUSD":0.6704454,"contextWindow":200000,"maxOutputTokens":32000},"claude-haiku-4-5-20251001":{"inputTokens":5804,"outputTokens":197,"cacheReadInputTokens":0,"cacheCreationInputTokens":0,"webSearchRequests":0,"costUSD":0.006789,"contextWindow":200000,"maxOutputTokens":32000}},"permission_denials":[],"terminal_reason":"completed","fast_mode_state":"off","uuid":"d8ca74cf-0c51-4abe-ab85-617575daf26b"}
diff --git a/.claude/loop-logs/tests-iter-1.log b/.claude/loop-logs/tests-iter-1.log
index 4e762dfc3..9fde44d6a 100644
--- a/.claude/loop-logs/tests-iter-1.log
+++ b/.claude/loop-logs/tests-iter-1.log
@@ -1,557 +1,695 @@
 
-> shipwright-cli@1.7.1 test
-> bash scripts/sw-pipeline-test.sh && bash scripts/sw-daemon-test.sh && bash scripts/sw-prep-test.sh && bash scripts/sw-fleet-test.sh && bash scripts/sw-fix-test.sh && bash scripts/sw-memory-test.sh && bash scripts/sw-session-test.sh && bash scripts/sw-init-test.sh && bash scripts/sw-tracker-test.sh && bash scripts/sw-heartbeat-test.sh && bash scripts/sw-remote-test.sh && bash scripts/sw-intelligence-test.sh && bash scripts/sw-pipeline-composer-test.sh && bash scripts/sw-self-optimize-test.sh && bash scripts/sw-predictive-test.sh && bash scripts/sw-frontier-test.sh && bash scripts/sw-connect-test.sh
+> shipwright-cli@3.2.4 test
+> bash scripts/sw-agi-roadmap-test.sh && bash scripts/sw-activity-test.sh && bash scripts/sw-adaptive-test.sh && bash scripts/sw-adversarial-test.sh && bash scripts/sw-architecture-enforcer-test.sh && bash scripts/sw-auth-test.sh && bash scripts/sw-autonomous-test.sh && bash scripts/sw-changelog-test.sh && bash scripts/sw-checkpoint-test.sh && bash scripts/sw-ci-test.sh && bash scripts/sw-cleanup-test.sh && bash scripts/sw-code-review-test.sh && bash scripts/sw-connect-test.sh && bash scripts/sw-context-budget-test.sh && bash scripts/sw-context-test.sh && bash scripts/sw-cost-test.sh && bash scripts/sw-daemon-test.sh && bash scripts/sw-dashboard-test.sh && bash scripts/sw-db-test.sh && bash scripts/sw-decompose-test.sh && bash scripts/sw-decide-test.sh && bash scripts/sw-deps-test.sh && bash scripts/sw-developer-simulation-test.sh && bash scripts/sw-discovery-test.sh && bash scripts/sw-doc-fleet-test.sh && bash scripts/sw-docs-agent-test.sh && bash scripts/sw-docs-test.sh && bash scripts/sw-doctor-test.sh && bash scripts/sw-dora-test.sh && bash scripts/sw-durable-test.sh && bash scripts/sw-e2e-orchestrator-test.sh && bash scripts/sw-eventbus-test.sh && bash scripts/sw-feedback-test.sh && bash scripts/sw-outcome-feedback-test.sh && bash scripts/sw-fix-test.sh && bash scripts/sw-fleet-discover-test.sh && bash scripts/sw-fleet-test.sh && bash scripts/sw-fleet-viz-test.sh && bash scripts/sw-frontier-test.sh && bash scripts/sw-github-app-test.sh && bash scripts/sw-github-checks-test.sh && bash scripts/sw-github-deploy-test.sh && bash scripts/sw-github-graphql-test.sh && bash scripts/sw-guild-test.sh && bash scripts/sw-heartbeat-test.sh && bash scripts/sw-hello-test.sh && bash scripts/sw-hygiene-test.sh && bash scripts/sw-incident-test.sh && bash scripts/sw-init-test.sh && bash scripts/sw-instrument-test.sh && bash scripts/sw-intelligence-test.sh && bash scripts/sw-jira-test.sh && bash scripts/sw-launchd-test.sh && bash scripts/sw-linear-test.sh && bash 
scripts/sw-logs-test.sh && bash scripts/sw-loop-test.sh && bash scripts/sw-memory-test.sh && bash scripts/sw-mission-control-test.sh && bash scripts/sw-model-router-test.sh && bash scripts/sw-otel-test.sh && bash scripts/sw-oversight-test.sh && bash scripts/sw-patrol-meta-test.sh && bash scripts/sw-pipeline-composer-test.sh && bash scripts/sw-pipeline-test.sh && bash scripts/sw-pipeline-vitals-test.sh && bash scripts/sw-pm-test.sh && bash scripts/sw-pr-lifecycle-test.sh && bash scripts/sw-predictive-test.sh && bash scripts/sw-prep-test.sh && bash scripts/sw-ps-test.sh && bash scripts/sw-public-dashboard-test.sh && bash scripts/sw-quality-profile-test.sh && bash scripts/sw-quality-test.sh && bash scripts/sw-reaper-test.sh && bash scripts/sw-recruit-test.sh && bash scripts/sw-regression-test.sh && bash scripts/sw-release-manager-test.sh && bash scripts/sw-release-test.sh && bash scripts/sw-root-cause-test.sh && bash scripts/sw-remote-test.sh && bash scripts/sw-replay-test.sh && bash scripts/sw-retro-test.sh && bash scripts/sw-scale-test.sh && bash scripts/sw-stall-detector-test.sh && bash scripts/sw-security-audit-test.sh && bash scripts/sw-self-optimize-test.sh && bash scripts/sw-session-test.sh && bash scripts/sw-setup-test.sh && bash scripts/sw-standup-test.sh && bash scripts/sw-status-test.sh && bash scripts/sw-strategic-test.sh && bash scripts/sw-stream-test.sh && bash scripts/sw-swarm-test.sh && bash scripts/sw-team-stages-test.sh && bash scripts/sw-templates-test.sh && bash scripts/sw-testgen-test.sh && bash scripts/sw-tmux-pipeline-test.sh && bash scripts/sw-tmux-test.sh && bash scripts/sw-trace-test.sh && bash scripts/sw-tracker-test.sh && bash scripts/sw-triage-test.sh && bash scripts/sw-upgrade-test.sh && bash scripts/sw-ux-test.sh && bash scripts/sw-webhook-test.sh && bash scripts/sw-widgets-test.sh && bash scripts/sw-worktree-test.sh && bash scripts/sw-lib-compat-test.sh && bash scripts/sw-lib-helpers-test.sh && bash 
scripts/sw-lib-error-actionability-test.sh && bash scripts/sw-lib-daemon-dispatch-test.sh && bash scripts/sw-lib-daemon-failure-test.sh && bash scripts/sw-lib-daemon-poll-test.sh && bash scripts/sw-lib-daemon-state-test.sh && bash scripts/sw-lib-daemon-triage-test.sh && bash scripts/sw-lib-daemon-patrol-test.sh && bash scripts/sw-lib-pipeline-detection-test.sh && bash scripts/sw-lib-pipeline-intelligence-test.sh && bash scripts/sw-lib-pipeline-quality-checks-test.sh && bash scripts/sw-lib-pipeline-stages-test.sh && bash scripts/sw-lib-pipeline-state-test.sh && bash scripts/sw-adapters-test.sh && bash scripts/sw-evidence-test.sh && bash scripts/sw-review-rerun-test.sh && bash scripts/sw-tracker-providers-test.sh && bash scripts/sw-budget-chaos-test.sh && bash scripts/sw-chaos-test.sh && bash scripts/sw-autonomous-e2e-test.sh && bash scripts/sw-memory-discovery-e2e-test.sh && bash scripts/sw-policy-e2e-test.sh && bash scripts/sw-e2e-smoke-test.sh && bash scripts/sw-dashboard-e2e-test.sh && bash scripts/sw-reward-aggregator-test.sh && bash scripts/sw-bandit-selector-test.sh && bash scripts/sw-policy-learner-test.sh && bash scripts/sw-autoresearch-e2e-test.sh
+
+
+[38;2;168;85;247m[1m╔════════════════════════════════════════════════════════════════╗[0m
+[38;2;168;85;247m[1m║  AGI-Roadmap Validation — Real Tests for Every Feature        ║[0m
+[38;2;168;85;247m[1m╚════════════════════════════════════════════════════════════════╝[0m
+
+[38;2;168;85;247m[1mPhase 1: Feedback Loops (Discovery, Memory, PM, Failure Learning)[0m
+  [38;2;0;212;255m▸[0m Daemon: failure_history initialized in state JSON... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: consecutive count uses reduce (run-from-newest, not total)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: get_max_retries_for_class returns per-class limits... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: exponential backoff formula 5*2^(n-3) is correct... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: resume_after parsed in UTC (not local TZ)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m PM: recommend --json flag implemented... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m PM: learn subcommand functional... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: PM recommend/learn wired into triage + success/failure... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: confidence < 60% upgrades to full template... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mPhase 2: Agent Coordination (Feedback, Predictive, Oversight, Autonomous)[0m
+  [38;2;0;212;255m▸[0m Feedback: ARTIFACTS_DIR respects caller override... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Feedback: rollback uses PIPESTATUS for correct exit code... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Predictive: anomaly detection returns severity for 5x baseline... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Predictive: inject-prevention command exists and runs... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: predictive anomaly/baseline/inject-prevention wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: memory metric wired into stage completion... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Oversight: gate approves clean review... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Oversight: gate rejects with --reject-if... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Oversight: gate JSON safe from newline/quote injection... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: oversight gate wired + respects SKIP_GATES... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: feedback collect/create-issue/rollback wired into monitor... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: intelligence prediction validation wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: predictive anomaly confirmation wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: memory fix-outcome negative path wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Triage: offline fallback with recruit... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Recruit: policy integration wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Recruit: meta feedback loop... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Recruit: audit (negative-compounding feedback)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Autonomous: safe recruit_args quoting... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Autonomous: Claude output redirected to findings file... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Autonomous: dual branch check (pipeline + daemon)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Autonomous: run_scheduler with loop/sleep... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Autonomous: trigger_pipeline_for_finding wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Incident: create_hotfix_issue echoes issue number... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Incident: trigger_pipeline wires --template hotfix... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Incident: trigger_rollback wires sw-feedback.sh... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mPhase 3: Quality Assurance (Code Review, Testgen, Swarm, Multi-Agent)[0m
+  [38;2;0;212;255m▸[0m Code review: run_claude_semantic_review exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Code review: semantic findings integrated... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Testgen: Claude prompt asks for real assertions... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Testgen: prompt piped to avoid shell expansion... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Swarm: spawn creates tmux session... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Swarm: retire kills tmux session... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Swarm: spawn/retire functional (real tmux)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Loop: multi-agent restarts not blocked... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mPhase 4: Meta-Cognition (Effectiveness, Self-Awareness, Capability)[0m
+  [38;2;0;212;255m▸[0m Pipeline: record_stage_effectiveness creates valid JSONL... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: self-awareness hint triggers on >50% failure rate... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: effectiveness recorded on both complete and failed... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: discovery inject wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: self-awareness hint injected into plan prompt... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mIntegration & Safety[0m
+  [38;2;0;212;255m▸[0m CI: integration-claude jobs in workflow... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Integration-claude: skip path functional... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m All modified scripts have strict mode... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m All modified scripts have ERR trap... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m No hardcoded secrets in scripts... [38;2;74;222;128m✓[0m
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 53 tests passed![0m
+
+
+[38;2;0;212;255m[1m  Shipwright Activity Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[1m  Script Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m Source guard pattern (if/then/fi)
+  [38;2;74;222;128m✓[0m VERSION variable defined
+
+[1m  Help Output[0m
+  [38;2;74;222;128m✓[0m help exits 0 and contains USAGE
+  [38;2;74;222;128m✓[0m help lists 'watch' subcommand
+  [38;2;74;222;128m✓[0m help lists 'snapshot' subcommand
+  [38;2;74;222;128m✓[0m help lists 'history' subcommand
+  [38;2;74;222;128m✓[0m help lists 'stats' subcommand
+  [38;2;74;222;128m✓[0m help lists 'agents' subcommand
+  [38;2;74;222;128m✓[0m --help alias works
+
+[1m  Error Handling[0m
+[38;2;0;212;255m[1mshipwright activity[0m — Live agent activity stream
+
+[1mUSAGE[0m
+  shipwright activity [subcommand] [options]
+
+[1mSUBCOMMANDS[0m
+  watch                      Live stream of agent activity (default)
+  snapshot                   Current state of all active agents
+  history [range]            Replay past activity (e.g., '1h', '10m', 'all')
+  stats                      Running counters (events, commits, tests, agents)
+  agents                     List known agents and last activity
+  help                       Show this help message
+
+[1mOPTIONS[0m
+  --type <type>              Filter events by type (e.g., 'stage.completed')
+  --agent <name>             Filter by agent name
+  --team <name>              Filter by team
+  --stage <name>             Filter by pipeline stage (e.g., 'build')
+
+[1mEXAMPLES[0m
+  \033[2mshipwright activity\033[0m                    # Live stream
+  \033[2mshipwright activity watch --type stage.*\033[0m  # Only stage events
+  \033[2mshipwright activity history 1h\033[0m           # Last hour
+  \033[2mshipwright activity snapshot\033[0m             # Current state
+  \033[2mshipwright activity stats\033[0m                # Counters
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
+
+[1m  Subcommands Without Events File[0m
+  [38;2;74;222;128m✓[0m snapshot exits non-zero with no events
+  [38;2;74;222;128m✓[0m stats exits non-zero with no events
+  [38;2;74;222;128m✓[0m agents exits non-zero with no events
+
+[1m  Event Emission[0m
+  [38;2;74;222;128m✓[0m emit_event creates events.jsonl
+  [38;2;74;222;128m✓[0m emit_event writes valid JSON
+  [38;2;74;222;128m✓[0m Event contains type field
+  [38;2;74;222;128m✓[0m Event contains agent field
+  [38;2;74;222;128m✓[0m Event contains numeric count
+
+[1m  Format Helpers[0m
+  [38;2;74;222;128m✓[0m get_icon_for_type commit returns icon
+  [38;2;74;222;128m✓[0m get_icon_for_type test.passed returns icon
+  [38;2;74;222;128m✓[0m get_icon_for_type unknown returns bullet
+  [38;2;74;222;128m✓[0m format_timestamp strips T and Z
+
+[1m  Stats With Events[0m
+  [38;2;74;222;128m✓[0m stats shows Total Events
+  [38;2;74;222;128m✓[0m stats shows Commits count
+  [38;2;74;222;128m✓[0m stats shows Pipelines count
 
+[1m  History Subcommand[0m
+  [38;2;74;222;128m✓[0m history all shows activity header
 
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright pipeline test — E2E Validation (Real Subprocess)     ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
 
-[2mSetting up mock environment...[0m
-[38;2;74;222;128m✓[0m Environment ready: [2m/tmp/sw-pipeline-test.vZ9o8O[0m
+[2m  ──────────────────────────────────────────[0m
 
-  [38;2;0;212;255m▸[0m Preflight passes with all mocks... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Preflight fails when sw-loop.sh missing... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Start requires --goal or --issue... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Intake with --goal creates branch + artifacts... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Intake with --issue fetches from GitHub... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Plan generates plan.md, dod.md, tasks... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Build invokes sw loop and commits... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Test stage captures results to log... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Review generates report with severities... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m PR stage creates PR URL artifact... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Full E2E pipeline (6 stages)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Resume continues from partial state... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Abort marks pipeline as aborted... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Dry run shows config, no artifacts... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Self-healing build→test retry loop... [38;2;74;222;128m✓[0m
+  [38;2;74;222;128m[1mAll 28 tests passed[0m
 
-[38;2;124;58;237m[1m━━━ Results ━━━[0m
-  [38;2;74;222;128mPassed:[0m 15
-  [38;2;248;113;113mFailed:[0m 0
-  [2mTotal:[0m  15
 
-[38;2;74;222;128m[1mAll 15 tests passed![0m
+[38;2;0;212;255m[1m  Shipwright Adaptive Tests[0m
+[2m  ══════════════════════════════════════════[0m
 
+[2m  help / version[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows USAGE
+  [38;2;74;222;128m✓[0m help shows SUBCOMMANDS
+  [38;2;74;222;128m✓[0m help mentions get
+  [38;2;74;222;128m✓[0m help mentions train
+  [38;2;74;222;128m✓[0m help mentions profile
+  [38;2;74;222;128m✓[0m version exits 0
+  [38;2;74;222;128m✓[0m version output contains version string
 
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright daemon test — Unit Tests (Synthetic Events)           ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
+[2m  error handling[0m
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
 
-[2mSetting up test environment...[0m
-[38;2;74;222;128m✓[0m Environment ready: [2m/tmp/sw-daemon-test.Ootf7j[0m
-
-  [38;2;0;212;255m▸[0m dora_grade deploy_freq Elite (>= 7)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m dora_grade deploy_freq High (>= 1)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m dora_grade deploy_freq Medium (>= 0.25)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m dora_grade deploy_freq Low (< 0.25)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m dora_grade CFR thresholds (Elite/High/Medium/Low)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Stage timings filter-first jq query... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m MTTR pairs failures with next success... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m epoch_to_iso helper function... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Health check detects stale jobs... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Priority label sorting... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Degradation alert triggers on high CFR... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Metrics --json output with cycle_time keys... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Self-labeling includes watch_label when enabled... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Self-labeling excludes watch_label when disabled... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Patrol recurring failures label construction... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m DORA degradation event detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Retry exhaustion event detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Untested script detection logic... [38;2;74;222;128m✓[0m
-
-[38;2;124;58;237m[1m━━━ Results ━━━[0m
-  [38;2;74;222;128mPassed:[0m 18
-  [38;2;248;113;113mFailed:[0m 0
-  [2mTotal:[0m  18
-
-[38;2;74;222;128m[1mAll 18 tests passed![0m
-
-
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright prep test — Validation Suite (Real Subprocess)        ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
+[2m  get command[0m
+  [38;2;74;222;128m✓[0m get timeout with default exits 0
 
-[2mSetting up test environment...[0m
-[38;2;74;222;128m✓[0m Environment ready: [2m/tmp/sw-prep-test.1SpJfU[0m
-
-  [38;2;0;212;255m▸[0m Node.js project detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Python project detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Go project detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Rust project detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m settings.json is valid JSON... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Hook scripts are executable... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Hook scripts have valid syntax... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m CLAUDE.md has required sections... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Check mode outputs scoring... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Idempotency without --force... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m --force overwrites modified files... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m No eval in generated hooks... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Definition of Done generated... [38;2;74;222;128m✓[0m
-
-[38;2;124;58;237m[1m━━━ Results ━━━[0m
-  [38;2;74;222;128mPassed:[0m 13
-  [38;2;248;113;113mFailed:[0m 0
-  [2mTotal:[0m  13
-
-[38;2;74;222;128m[1mAll 13 tests passed![0m
-
-
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright fleet test — Unit Tests                                ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
+[2m  profile command[0m
+  [38;2;74;222;128m✓[0m profile exits 0
 
-[2mSetting up test environment...[0m
-[38;2;74;222;128m✓[0m Environment ready: [2m/tmp/sw-fleet-test.lIcp2s[0m
-
-  [38;2;0;212;255m▸[0m Help output contains expected sections... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Help via --help flag... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Config parsing — valid config... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Config parsing — missing config file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Config parsing — invalid JSON... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Config parsing — empty repos array... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Config defaults applied... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet init generates config template... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet init skips when config exists... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start spawns tmux sessions per repo... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start skips missing repos... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start skips existing sessions... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start creates fleet state file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start emits fleet.started event... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start applies repo-level overrides... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet stop kills sessions and cleans state... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet stop — no fleet running... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet stop emits fleet.stopped event... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet status — no fleet running... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet status shows dashboard... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet metrics — no events file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet metrics dashboard output... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet metrics JSON output... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet metrics period flag... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Session name generation... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start skips non-git repos... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Unknown subcommand... [38;2;74;222;128m✓[0m
-
-[38;2;124;58;237m[1m━━━ Results ━━━[0m
-  [38;2;74;222;128mPassed:[0m 27
-  [38;2;248;113;113mFailed:[0m 0
-  [2mTotal:[0m  27
-
-[38;2;74;222;128m[1mAll 27 tests passed![0m
-
-
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright fix test — Unit Tests                                  ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
+[2m  reset command[0m
+  [38;2;74;222;128m✓[0m reset exits 0
 
-[2mSetting up test environment...[0m
-[38;2;74;222;128m✓[0m Environment ready: [2m/tmp/sw-fix-test.yrL4tG[0m
-
-  [38;2;0;212;255m▸[0m Help output contains expected sections... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Help via --help flag... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Missing goal shows error... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Missing repos shows error... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Arg parsing — --repos comma-separated... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Arg parsing — --repos-from file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Arg parsing — --repos-from missing file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Arg parsing — --pipeline template... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Arg parsing — --max-parallel... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Arg parsing — --branch-prefix... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Dry run shows what would happen... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Dry run does not create state file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fix status — no sessions... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fix status shows existing sessions... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Invalid repo directory shows error... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fix start creates state file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fix start emits events... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fix start — summary output... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Branch name sanitization... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fix header shows configuration... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Non-git repo warning... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Per-repo event tracking... [38;2;74;222;128m✓[0m
-
-[38;2;124;58;237m[1m━━━ Results ━━━[0m
-  [38;2;74;222;128mPassed:[0m 22
-  [38;2;248;113;113mFailed:[0m 0
-  [2mTotal:[0m  22
-
-[38;2;74;222;128m[1mAll 22 tests passed![0m
-
-
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright memory+cost test — Unit Tests for Memory & Cost      ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
-
-[2mSetting up mock environment...[0m
-[38;2;74;222;128m✓[0m Environment ready: [2m/tmp/sw-memory-test.IW0uqN[0m
-
-  [38;2;0;212;255m▸[0m Memory capture from pipeline state... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Memory inject returns context for each stage... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Failure capture stores patterns... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Pattern detection identifies project type... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Cross-repo vs per-repo isolation... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Memory show displays dashboard... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Memory search finds matching entries... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Memory export produces valid JSON... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Memory forget clears repo memory... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Cost calculation for each model... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Cost recording writes to costs.json... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Budget set and check... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Cost dashboard runs without errors... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Cost JSON output is valid... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Actionable failures threshold filtering... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Actionable failures with no file returns []... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m DORA baseline calculation from events... [38;2;74;222;128m✓[0m
-
-[38;2;124;58;237m[1m━━━ Results ━━━[0m
-  [38;2;74;222;128mPassed:[0m 17
-  [38;2;248;113;113mFailed:[0m 0
-  [2mTotal:[0m  17
-
-[38;2;74;222;128m[1mAll 17 tests passed![0m
+[2m  script safety[0m
+  [38;2;74;222;128m✓[0m Uses set -euo pipefail
+  [38;2;74;222;128m✓[0m Has source guard pattern
 
+[2m  statistical functions[0m
+  [38;2;74;222;128m✓[0m percentile, mean, median functions defined in source
+  [38;2;74;222;128m✓[0m mean returns numeric value (avg of 1-5 is 3)
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright session — E2E Test Suite              ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+[2m  get_timeout / get_iterations / get_model[0m
+  [38;2;74;222;128m✓[0m get_timeout returns number (default with no events)
+  [38;2;74;222;128m✓[0m get_iterations returns number
+  [38;2;74;222;128m✓[0m get_model returns valid model name
 
-[2mSetting up test environment...[0m
-[2mTest tmux session: sw-test-1268715[0m
-
-[38;2;124;58;237m[1mTemplate Loading[0m
-  [38;2;0;212;255m▸[0m Load feature-dev template (3 agents)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Load exploration template (2 agents)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Missing template returns error... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m All 24 templates load successfully... [38;2;74;222;128m✓[0m
-
-[38;2;124;58;237m[1mWindow Creation[0m
-  [38;2;0;212;255m▸[0m No-launch creates window without claude... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Duplicate window detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Window gets dark theme... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Auto-generated team name... [38;2;74;222;128m✓[0m
-
-[38;2;124;58;237m[1mPrompt & Launcher[0m
-  [38;2;0;212;255m▸[0m Launcher script generation with template... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Output includes agents from template... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Output includes goal when provided... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m No template + goal works... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m No template + no goal = interactive... [38;2;74;222;128m✓[0m
-
-[38;2;124;58;237m[1mCLI & Configuration[0m
-  [38;2;0;212;255m▸[0m Help flag... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Unknown option... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m TMPDIR used for launcher files... [38;2;74;222;128m✓[0m
-
-[38;2;124;58;237m[1mEnhanced Features[0m
-  [38;2;0;212;255m▸[0m Template auto-suggestion from goal... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m No suggestion without goal... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Memory injection in prompt... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m CLAUDE.md reminder in prompt... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Secure temp dir in source... [38;2;74;222;128m✓[0m
+[2m  train subcommand[0m
+  [38;2;74;222;128m✓[0m train subcommand runs with mock events
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 21 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[2m  ──────────────────────────────────────────[0m
 
+  [38;2;74;222;128m[1mAll 20 tests passed[0m
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright init — E2E Test Suite                 ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
 
-[2mSetting up sandboxed environment...[0m
-[2mTemp dir: /tmp/sw-init-test.WldBc1[0m
 
-[38;2;124;58;237m[1mConfiguration[0m
-  [38;2;0;212;255m▸[0m Settings.json created with agent teams... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Settings merge preserves existing vars... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m tmux.conf installed... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Overlay installed... [38;2;74;222;128m✓[0m
+[38;2;0;212;255m[1m  shipwright adversarial test[0m
+[2m  ══════════════════════════════════════════[0m
 
-[38;2;124;58;237m[1mTemplates[0m
-  [38;2;0;212;255m▸[0m Team templates installed (>= 10)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Pipeline templates installed (>= 5)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Legacy templates path populated... [38;2;74;222;128m✓[0m
+[2m  ══════════════════════════════════════════[0m
 
-[38;2;124;58;237m[1mRobustness[0m
-  [38;2;0;212;255m▸[0m Idempotency — double init safe... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Doctor runs at end... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Help flag... [38;2;74;222;128m✓[0m
+[1m  Script Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m Source guard pattern (if/then/fi)
+  [38;2;74;222;128m✓[0m VERSION variable defined
 
-[38;2;124;58;237m[1mHook Wiring[0m
-  [38;2;0;212;255m▸[0m JSONC stripped from settings.json... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Hooks wired into settings.json... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Hook wiring preserves existing hooks... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m SessionStart hook installed... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Hook wiring with pre-existing settings... [38;2;74;222;128m✓[0m
+[1m  Help Output[0m
+  [38;2;74;222;128m✓[0m help exits 0 and contains USAGE
+  [38;2;74;222;128m✓[0m help lists 'review' subcommand
+  [38;2;74;222;128m✓[0m help lists 'iterate' subcommand
+  [38;2;74;222;128m✓[0m help mentions adversarial_enabled flag
+  [38;2;74;222;128m✓[0m --help alias works
+  [38;2;74;222;128m✓[0m -h alias works
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 15 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[1m  Error Handling[0m
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
 
+[1m  Review Subcommand[0m
+  [38;2;74;222;128m✓[0m review disabled returns empty JSON array
+  [38;2;74;222;128m✓[0m review without diff arg exits non-zero
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright tracker — Test Suite                  ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+[1m  Iterate Subcommand[0m
+  [38;2;74;222;128m✓[0m iterate without args exits non-zero
+  [38;2;74;222;128m✓[0m iterate with empty findings converges
+  [38;2;74;222;128m✓[0m iterate past max rounds returns findings
 
-[2mSetting up test environment...[0m
+[1m  Configuration[0m
+  [38;2;74;222;128m✓[0m ADVERSARIAL_MAX_ROUNDS env var respected
+  [38;2;74;222;128m✓[0m disabled config returns empty array
 
-[38;2;124;58;237m[1mProvider Loading[0m
-  [38;2;0;212;255m▸[0m Provider loads from config (linear)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Provider loads jira... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Graceful skip when no provider... [38;2;74;222;128m✓[0m
+[1m  Event Emission[0m
+  [38;2;74;222;128m✓[0m emit_event creates events.jsonl
+  [38;2;74;222;128m✓[0m emit_event writes valid JSON
+  [38;2;74;222;128m✓[0m Event contains type field
 
-[38;2;124;58;237m[1mPipeline Enrichment[0m
-  [38;2;0;212;255m▸[0m Stage descriptions exist for all 12 stages... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Enriched progress body has Delivering line... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Enriched progress body has stage descriptions... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Pipeline state includes stage_progress... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Pipeline state includes stage description... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mIntegration[0m
-  [38;2;0;212;255m▸[0m Tracker notify routes to provider (mock)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Dashboard reads goal from pipeline state... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Jira config validation... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Linear config migration (legacy fallback)... [38;2;74;222;128m✓[0m
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 12 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
 
+[2m  ──────────────────────────────────────────[0m
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright heartbeat + checkpoint — Test Suite   ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
 
-[2mSetting up test environment...[0m
 
-[38;2;124;58;237m[1mHeartbeat Lifecycle[0m
-  [38;2;0;212;255m▸[0m Write heartbeat creates JSON file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Check heartbeat reports alive... [38;2;74;222;128m[1m✓[0m Job test-job-alive alive (0s ago)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Check heartbeat reports stale... [38;2;250;204;21m[1m⚠[0m Job test-job-stale stale (192940576s ago, timeout: 120s)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Clear heartbeat removes file... [38;2;74;222;128m[1m✓[0m Cleared heartbeat for job: test-job-clear
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m List heartbeats returns JSON array... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Heartbeat update overwrites existing... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Check missing heartbeat returns error... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Heartbeat dir auto-created when missing... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mCheckpoint Lifecycle[0m
-  [38;2;0;212;255m▸[0m Checkpoint save creates JSON file... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 5)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Checkpoint restore outputs JSON... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mtest[0m (iteration 3)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Checkpoint restore missing stage fails... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Checkpoint clear removes file... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mreview[0m (iteration 1)
-[38;2;74;222;128m[1m✓[0m Cleared checkpoint for stage [1mreview[0m
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Checkpoint clear --all removes all... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 1)
-[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mtest[0m (iteration 2)
-[38;2;74;222;128m[1m✓[0m Cleared 2 checkpoint(s)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Checkpoint save with files-modified... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 7)
-[38;2;74;222;128m✓[0m
+[38;2;0;212;255m[1m  shipwright architecture-enforcer test[0m
+[2m  ══════════════════════════════════════════[0m
 
-[38;2;124;58;237m[1mIntegration[0m
-  [38;2;0;212;255m▸[0m Pipeline script has heartbeat functions... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Loop script has heartbeat and checkpoint... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Pipeline has human intervention checks... [38;2;74;222;128m✓[0m
+[2m  ══════════════════════════════════════════[0m
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 17 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[1m  Script Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m Source guard pattern (if/then/fi)
+  [38;2;74;222;128m✓[0m VERSION variable defined
 
+[1m  Help Output[0m
+  [38;2;74;222;128m✓[0m help exits 0 and contains USAGE
+  [38;2;74;222;128m✓[0m help lists 'build' subcommand
+  [38;2;74;222;128m✓[0m help lists 'validate' subcommand
+  [38;2;74;222;128m✓[0m help lists 'evolve' subcommand
+  [38;2;74;222;128m✓[0m help mentions architecture_enabled flag
+  [38;2;74;222;128m✓[0m --help alias works
+  [38;2;74;222;128m✓[0m -h alias works
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright remote — Test Suite                   ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+[1m  Error Handling[0m
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
 
-[2mSetting up test environment...[0m
+[1m  Build Subcommand[0m
+  [38;2;74;222;128m✓[0m build disabled returns empty JSON object
+  [38;2;74;222;128m✓[0m build with enabled returns model with layers
+  [38;2;74;222;128m✓[0m build model contains patterns array
+  [38;2;74;222;128m✓[0m build model contains conventions array
 
-[38;2;124;58;237m[1mMachine Registry[0m
-  [38;2;0;212;255m▸[0m Add machine creates machines.json... [38;2;0;212;255m[1m▸[0m Checking shipwright installation at [2m/tmp/sw-remote-test.PmYCBx/mock-install[0m...
-[38;2;74;222;128m[1m✓[0m Shipwright found at /tmp/sw-remote-test.PmYCBx/mock-install
-[38;2;74;222;128m[1m✓[0m Registered machine: [1mbuilder-1[0m (localhost, worker, 4 workers)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Add second machine appends to array... [38;2;0;212;255m[1m▸[0m Checking shipwright installation at [2m/tmp/sw-remote-test.PmYCBx/mock-install[0m...
-[38;2;74;222;128m[1m✓[0m Shipwright found at /tmp/sw-remote-test.PmYCBx/mock-install
-[38;2;74;222;128m[1m✓[0m Registered machine: [1mbuilder-2[0m (localhost, worker, 8 workers)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Remove machine by name... [38;2;74;222;128m[1m✓[0m Removed machine: [1mbuilder-2[0m
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m List machines returns output... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m machines.json uses atomic writes... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Duplicate machine name prevented... [38;2;0;212;255m[1m▸[0m Use [38;2;0;212;255mshipwright remote remove builder-1[0m first
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Remote script has help command... [38;2;74;222;128m✓[0m
+[1m  Validate Subcommand[0m
+  [38;2;74;222;128m✓[0m validate disabled returns empty array
+  [38;2;74;222;128m✓[0m validate without diff arg exits non-zero
+  [38;2;74;222;128m✓[0m validate without model file returns empty array
 
-[38;2;124;58;237m[1mCLI & Dashboard Integration[0m
-  [38;2;0;212;255m▸[0m CLI router includes remote command... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m CLI router includes heartbeat command... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m CLI router includes checkpoint command... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Doctor has heartbeat health check... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Doctor has remote machine checks... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Status shows heartbeat section... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Status shows remote machines section... [38;2;74;222;128m✓[0m
+[1m  Evolve Subcommand[0m
+  [38;2;74;222;128m✓[0m evolve disabled exits 0
+  [38;2;74;222;128m✓[0m evolve without model exits 0
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 14 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[1m  Model Storage[0m
+  [38;2;74;222;128m✓[0m build stores model in ~/.shipwright/memory/
+  [38;2;74;222;128m✓[0m Stored model is valid JSON
 
+[1m  Event Emission[0m
+  [38;2;74;222;128m✓[0m emit_event creates events.jsonl
+  [38;2;74;222;128m✓[0m emit_event writes valid JSON
+  [38;2;74;222;128m✓[0m Event contains type field
 
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright intelligence test — Unit Tests                       ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
 
-[2mSetting up test environment...[0m
-✓ Environment ready: /tmp/sw-intelligence-test.wTXBVg
 
-  ▸ analyze_issue returns valid schema... ✓
-  ▸ Cache hit on second call with same input... ✓
-  ▸ Graceful degradation when claude CLI unavailable... ✓
-  ▸ compose_pipeline produces valid pipeline JSON... ✓
-  ▸ recommend_model returns valid model names... ✓
-  ▸ predict_cost returns numeric estimates... ✓
-  ▸ Cache TTL expiry returns miss... ✓
-  ▸ search_memory returns ranked results... ✓
-  ▸ Feature flag disabled returns fallback... ✓
-  ▸ Events emitted for analysis... ✓
-  ▸ recommend_model emits events... ✓
-  ▸ Cache init creates file if missing... ✓
 
-━━━ Results ━━━
-  Passed: 12
-  Failed: 0
-  Total:  12
+[2m  ──────────────────────────────────────────[0m
 
-All 12 tests passed!
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
 
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright pipeline composer — Test Suite        ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+[38;2;0;212;255m[1m  Shipwright Auth Tests[0m
+[2m  ══════════════════════════════════════════[0m
 
-[2mSetting up test environment...[0m
+[1m  Help[0m
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows commands
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m unknown command shows error
+[1m  Status & Users[0m
+  [38;2;74;222;128m✓[0m status with no login shows warning
+  [38;2;74;222;128m✓[0m users with empty shows warning
+  [38;2;74;222;128m✓[0m token with no user errors
+  [38;2;74;222;128m✓[0m switch without user exits non-zero
+[1m  Auth Storage[0m
+  [38;2;74;222;128m✓[0m auth file has users array
+  [38;2;74;222;128m✓[0m auth file has active_user
+  [38;2;74;222;128m✓[0m users lists stored user
+  [38;2;74;222;128m✓[0m token shows stored token
+  [38;2;74;222;128m✓[0m user info shows login
+  [38;2;74;222;128m✓[0m switch to nonexistent errors
+  [38;2;74;222;128m✓[0m logout succeeds
 
-[38;2;124;58;237m[1mPipeline Composition[0m
-  [38;2;0;212;255m▸[0m Composed pipeline has valid stage ordering... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m High-risk issue gets security stages... [38;2;0;212;255m[1m▸[0m Composing pipeline with intelligence engine...
-[38;2;74;222;128m[1m✓[0m Composed pipeline: 7 stages
-.claude/pipeline-artifacts/composed-pipeline.json
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fallback to static template when no intelligence... [38;2;74;222;128m✓[0m
+[2m  ──────────────────────────────────────────[0m
 
-[38;2;124;58;237m[1mConditional Stage Insertion[0m
-  [38;2;0;212;255m▸[0m Stage inserted at correct position after build... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Insert into nonexistent stage fails... [38;2;74;222;128m✓[0m
+  [38;2;74;222;128m[1mAll 15 tests passed[0m
 
-[38;2;124;58;237m[1mModel Downgrade[0m
-  [38;2;0;212;255m▸[0m Budget constraint triggers model downgrades... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Downgrade with nonexistent stage fails... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mPipeline Validation[0m
-  [38;2;0;212;255m▸[0m Validation accepts valid pipeline... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Validation rejects invalid ordering (test before build)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Validation rejects missing stage ids... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Validation rejects missing stages array... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mIteration Estimation[0m
-  [38;2;0;212;255m▸[0m Iteration estimates are reasonable (1-50 range)... [38;2;74;222;128m✓[0m
+[38;2;0;212;255m[1m  Shipwright Autonomous Tests[0m
+[2m  ══════════════════════════════════════════[0m
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 12 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[2m  ══════════════════════════════════════════[0m
 
+  [38;2;74;222;128m✓[0m help shows usage text
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m unknown command exits 1
+  [38;2;74;222;128m✓[0m start shows running message
+  [38;2;74;222;128m✓[0m state.json created after start
+  [38;2;74;222;128m✓[0m state status is running
+  [38;2;74;222;128m✓[0m config.json created
+  [38;2;74;222;128m✓[0m config is valid JSON
+  [38;2;74;222;128m✓[0m status shows dashboard
+  [38;2;74;222;128m✓[0m pause sets status to paused
+  [38;2;74;222;128m✓[0m resume sets status to running
+  [38;2;74;222;128m✓[0m stop sets status to stopped
+  [38;2;74;222;128m✓[0m config show displays settings
+  [38;2;74;222;128m✓[0m config set interval works
+  [38;2;74;222;128m✓[0m history handles no data
 
-[38;2;124;58;237m[1m━━━ shipwright self-optimize tests ━━━[0m
+[1m  Config Set/Show Cycle[0m
+  [38;2;74;222;128m✓[0m config show reflects set value
+  [38;2;74;222;128m✓[0m config value persists in file
 
-  ▸ Outcome analysis extracts correct metrics... ✓
-  ▸ Outcome analysis emits event... ✓
-  ▸ Outcome analysis rejects missing file... ✓
-  ▸ Template weight increases for high success... ✓
-  ▸ Template weight decreases for low success... ✓
-  ▸ A/B test selects ~20% sample... ✓
-  ▸ Iteration model updates with data points... ✓
-  ▸ Model routing tracks success rates... ✓
-  ▸ Model routing keeps opus with few sonnet samples... ✓
-  ▸ Memory pruning removes old patterns... ✓
-  ▸ Memory strengthening boosts confirmed patterns... ✓
-  ▸ Memory promotion copies cross-repo patterns... ✓
-  ▸ Full analysis runs on empty data... ✓
-  ▸ Report generates output with data... ✓
-  ▸ Report handles empty outcomes... ✓
-  ▸ Outcome analysis extracts stage data... ✓
+[1m  Config Structure[0m
+  [38;2;74;222;128m✓[0m config contains key: cycle_interval_minutes
+  [38;2;74;222;128m✓[0m config contains key: max_issues_per_cycle
+  [38;2;74;222;128m✓[0m config contains key: daemon_aware
 
-━━━ Results ━━━
-  Passed: 16
-  Failed: 0
-  Total:  16
+[1m  History With Fixture Events[0m
+  [38;2;74;222;128m✓[0m history shows recent cycles
+  [38;2;74;222;128m✓[0m history shows cycle entries
 
-All 16 tests passed!
+[1m  Status Fields[0m
+  [38;2;74;222;128m✓[0m status when running includes Status
+  [38;2;74;222;128m✓[0m status when running includes Cycles
+  [38;2;74;222;128m✓[0m status when running includes Issues Created
+  [38;2;74;222;128m✓[0m status when running includes Pipelines
+  [38;2;74;222;128m✓[0m status when running includes Cycle Interval
+  [38;2;74;222;128m✓[0m status when running shows running
+  [38;2;74;222;128m✓[0m status when stopped shows stopped
 
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright predictive test                              ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════════════╝[0m
 
+[2m  ──────────────────────────────────────────[0m
 
-[38;2;124;58;237m[1mRisk Assessment[0m
-  [38;2;0;212;255m▸[0m Risk returns valid schema with 0-100 range... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Risk elevates for complex keywords... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Risk emits event... [38;2;74;222;128m✓[0m
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
 
-[38;2;124;58;237m[1mAnomaly Detection[0m
-  [38;2;0;212;255m▸[0m Critical at 3x threshold (181 vs 60 baseline)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Normal at 2x (119 vs 60 baseline)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Warning between 2x and 3x (150 vs 60)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Normal when no baseline exists... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Emits event for critical anomaly... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mBaseline Management[0m
-  [38;2;0;212;255m▸[0m First data point uses raw value... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m EMA calculation (0.9*100 + 0.1*200 = 110)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Creates baseline file if missing... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mPreventative Injection[0m
-  [38;2;0;212;255m▸[0m Injects context from matching patterns... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Returns empty for non-matching stage... [38;2;74;222;128m✓[0m
+[38;2;0;212;255m[1m  Shipwright Changelog Tests[0m
+[2m  ══════════════════════════════════════════[0m
 
-[38;2;124;58;237m[1mGraceful Degradation[0m
-  [38;2;0;212;255m▸[0m Works without intelligence engine... [38;2;74;222;128m✓[0m
+[2m  ══════════════════════════════════════════[0m
 
-[38;2;124;58;237m[1mAI Patrol[0m
-  [38;2;0;212;255m▸[0m AI patrol returns structured findings... [38;2;74;222;128m✓[0m
+[2m  help / version[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows USAGE
+  [38;2;74;222;128m✓[0m help mentions generate
+  [38;2;74;222;128m✓[0m help mentions preview
+  [38;2;74;222;128m✓[0m help mentions version
+  [38;2;74;222;128m✓[0m help mentions migrate
+  [38;2;74;222;128m✓[0m VERSION variable defined
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 15 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[2m  error handling[0m
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
 
+[2m  formats command[0m
+  [38;2;74;222;128m✓[0m formats exits 0
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright frontier — Test Suite                 ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+[2m  generate command[0m
+  [38;2;74;222;128m✓[0m generate exits 0
 
-[2mSetting up test environment...[0m
+[2m  version command[0m
+  [38;2;74;222;128m✓[0m version recommendation exits 0
 
-[38;2;124;58;237m[1mAdversarial Review[0m
-  [38;2;0;212;255m▸[0m Adversarial review produces structured findings... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Adversarial iteration converges on no critical findings... [38;2;74;222;128m✓[0m
+[2m  script safety[0m
+  [38;2;74;222;128m✓[0m Uses set -euo pipefail
+  [38;2;74;222;128m✓[0m Has source guard pattern
 
-[38;2;124;58;237m[1mDeveloper Simulation[0m
-  [38;2;0;212;255m▸[0m Simulation generates objections from 3 personas... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Simulation address returns action items... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mArchitecture Enforcer[0m
-  [38;2;0;212;255m▸[0m Architecture model has valid schema... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Architecture validates changes (violation detected)... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mGraceful Degradation[0m
-  [38;2;0;212;255m▸[0m All three degrade gracefully when claude unavailable... [38;2;74;222;128m✓[0m
+[2m  ──────────────────────────────────────────[0m
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 7 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  shipwright checkpoint test[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1m  Script Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m VERSION variable defined
+
+[1m  Help Output[0m
+  [38;2;74;222;128m✓[0m help exits 0 and contains USAGE
+  [38;2;74;222;128m✓[0m help lists 'save' subcommand
+  [38;2;74;222;128m✓[0m help lists 'restore' subcommand
+  [38;2;74;222;128m✓[0m help lists 'list' subcommand
+  [38;2;74;222;128m✓[0m help lists 'clear' subcommand
+  [38;2;74;222;128m✓[0m help lists 'expire' subcommand
+  [38;2;74;222;128m✓[0m --help alias works
+  [38;2;74;222;128m✓[0m -h alias works
+
+[1m  Error Handling[0m
+
+[38;2;0;212;255m[1mshipwright checkpoint[0m [2mv3.2.4[0m — Save and restore agent state mid-stage
+
+[1mUSAGE[0m
+  [38;2;0;212;255mshipwright checkpoint[0m <command> [options]
+
+[1mCOMMANDS[0m
+  [38;2;0;212;255msave[0m           Save a checkpoint for a stage
+  [38;2;0;212;255mrestore[0m        Restore a checkpoint (prints JSON to stdout)
+  [38;2;0;212;255msave-context[0m   Save Claude context (goal, findings, test output) for resume
+  [38;2;0;212;255mrestore-context[0m Restore Claude context (exports RESTORED_* and SW_LOOP_* vars)
+  [38;2;0;212;255mlist[0m      Show all available checkpoints
+  [38;2;0;212;255mclear[0m     Remove checkpoint(s)
+  [38;2;0;212;255mexpire[0m    Remove checkpoints older than N hours
+
+[1mSAVE OPTIONS[0m
+  [38;2;0;212;255m--stage[0m <name>              Stage name (required)
+  [38;2;0;212;255m--iteration[0m <n>             Current iteration number
+  [38;2;0;212;255m--git-sha[0m <sha>             Git commit SHA (default: HEAD)
+  [38;2;0;212;255m--files-modified[0m "f1,f2"    Comma-separated list of modified files
+  [38;2;0;212;255m--tests-passing[0m             Mark tests as passing
+  [38;2;0;212;255m--loop-state[0m <state>        Loop state (running, paused, etc.)
+
+[1mRESTORE OPTIONS[0m
+  [38;2;0;212;255m--stage[0m <name>              Stage to restore (required)
+
+[1mCLEAR OPTIONS[0m
+  [38;2;0;212;255m--stage[0m <name>              Stage to clear
+  [38;2;0;212;255m--all[0m                       Clear all checkpoints
+
+[1mEXPIRE OPTIONS[0m
+  [38;2;0;212;255m--hours[0m <n>                 Max age in hours (default: 24)
+
+[1mEXAMPLES[0m
+  [2mshipwright checkpoint save --stage build --iteration 5[0m
+  [2mshipwright checkpoint save --stage build --iteration 3 --tests-passing --files-modified "src/auth.ts,src/middleware.ts"[0m
+  [2mshipwright checkpoint restore --stage build[0m
+  [2mshipwright checkpoint list[0m
+  [2mshipwright checkpoint clear --stage build[0m
+  [2mshipwright checkpoint clear --all[0m
+  [2mshipwright checkpoint expire --hours 48[0m
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
+
+[1m  Save Subcommand[0m
+
+[38;2;0;212;255m[1mshipwright checkpoint[0m [2mv3.2.4[0m — Save and restore agent state mid-stage
+
+[1mUSAGE[0m
+  [38;2;0;212;255mshipwright checkpoint[0m <command> [options]
+
+[1mCOMMANDS[0m
+  [38;2;0;212;255msave[0m           Save a checkpoint for a stage
+  [38;2;0;212;255mrestore[0m        Restore a checkpoint (prints JSON to stdout)
+  [38;2;0;212;255msave-context[0m   Save Claude context (goal, findings, test output) for resume
+  [38;2;0;212;255mrestore-context[0m Restore Claude context (exports RESTORED_* and SW_LOOP_* vars)
+  [38;2;0;212;255mlist[0m      Show all available checkpoints
+  [38;2;0;212;255mclear[0m     Remove checkpoint(s)
+  [38;2;0;212;255mexpire[0m    Remove checkpoints older than N hours
+
+[1mSAVE OPTIONS[0m
+  [38;2;0;212;255m--stage[0m <name>              Stage name (required)
+  [38;2;0;212;255m--iteration[0m <n>             Current iteration number
+  [38;2;0;212;255m--git-sha[0m <sha>             Git commit SHA (default: HEAD)
+  [38;2;0;212;255m--files-modified[0m "f1,f2"    Comma-separated list of modified files
+  [38;2;0;212;255m--tests-passing[0m             Mark tests as passing
+  [38;2;0;212;255m--loop-state[0m <state>        Loop state (running, paused, etc.)
+
+[1mRESTORE OPTIONS[0m
+  [38;2;0;212;255m--stage[0m <name>              Stage to restore (required)
+
+[1mCLEAR OPTIONS[0m
+  [38;2;0;212;255m--stage[0m <name>              Stage to clear
+  [38;2;0;212;255m--all[0m                       Clear all checkpoints
+
+[1mEXPIRE OPTIONS[0m
+  [38;2;0;212;255m--hours[0m <n>                 Max age in hours (default: 24)
+
+[1mEXAMPLES[0m
+  [2mshipwright checkpoint save --stage build --iteration 5[0m
+  [2mshipwright checkpoint save --stage build --iteration 3 --tests-passing --files-modified "src/auth.ts,src/middleware.ts"[0m
+  [2mshipwright checkpoint restore --stage build[0m
+  [2mshipwright checkpoint list[0m
+  [2mshipwright checkpoint clear --stage build[0m
+  [2mshipwright checkpoint clear --all[0m
+  [2mshipwright checkpoint expire --hours 48[0m
+  [38;2;74;222;128m✓[0m save without --stage exits non-zero
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 5)
+  [38;2;74;222;128m✓[0m save creates checkpoint file
+  [38;2;74;222;128m✓[0m Checkpoint is valid JSON
+  [38;2;74;222;128m✓[0m Checkpoint stage field correct
+  [38;2;74;222;128m✓[0m Checkpoint iteration field correct
+  [38;2;74;222;128m✓[0m Checkpoint git_sha populated
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mtest[0m (iteration 0)
+  [38;2;74;222;128m✓[0m save --tests-passing sets true
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mreview[0m (iteration 0)
+  [38;2;74;222;128m✓[0m save --files-modified stores 2 files
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mdeploy[0m (iteration 0)
+  [38;2;74;222;128m✓[0m save --loop-state stores state
+  [38;2;74;222;128m✓[0m Checkpoint created_at timestamp present
+
+[1m  Restore Subcommand[0m
+  [38;2;74;222;128m✓[0m restore returns checkpoint JSON
+  [38;2;74;222;128m✓[0m Restored checkpoint has correct stage
+  [38;2;74;222;128m✓[0m restore missing stage exits non-zero
+  [38;2;74;222;128m✓[0m restore without --stage exits non-zero
+
+[1m  List Subcommand[0m
+  [38;2;74;222;128m✓[0m list shows Checkpoints header
+  [38;2;74;222;128m✓[0m list shows build checkpoint
+  [38;2;74;222;128m✓[0m list shows checkpoint count
+  [38;2;74;222;128m✓[0m list with no checkpoints shows empty
+
+[1m  Clear Subcommand[0m
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 1)
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mtest[0m (iteration 2)
+[38;2;74;222;128m[1m✓[0m Cleared checkpoint for stage [1mbuild[0m
+  [38;2;74;222;128m✓[0m clear --stage removes specific checkpoint
+  [38;2;74;222;128m✓[0m clear --stage preserves other checkpoints
+  [38;2;74;222;128m✓[0m clear without args exits non-zero
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 3)
+[38;2;74;222;128m[1m✓[0m Cleared 2 checkpoint(s)
+  [38;2;74;222;128m✓[0m clear --all removes all checkpoints
+
+[1m  Expire Subcommand[0m
+  [38;2;74;222;128m✓[0m expire with no checkpoints exits 0
+
+[1m  Save-context / Restore-context[0m
+  [38;2;74;222;128m✓[0m save-context creates claude-context.json
+  [38;2;74;222;128m✓[0m Context goal saved correctly
+  [38;2;74;222;128m✓[0m Context iteration saved correctly
+  [38;2;74;222;128m✓[0m restore-context exports RESTORED_GOAL
+  [38;2;74;222;128m✓[0m restore-context exports SW_LOOP_GOAL
+
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright CI Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;74;222;128m✓[0m help shows usage text
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m version shows version
+  [38;2;74;222;128m✓[0m unknown command exits 1
+  [38;2;74;222;128m✓[0m generate starts processing
+  [38;2;74;222;128m✓[0m validate runs on valid workflow
+  [38;2;74;222;128m✓[0m VERSION is defined
+  [38;2;74;222;128m✓[0m analyze shows analysis
+  [38;2;74;222;128m✓[0m analyze shows cache info
+  [38;2;74;222;128m✓[0m matrix generates config
+  [38;2;74;222;128m✓[0m matrix workflow file exists
+  [38;2;74;222;128m✓[0m validate passes on valid workflow
+  [38;2;74;222;128m✓[0m runners list shows options
+  [38;2;74;222;128m✓[0m runners recommend shows guidance
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Cleanup Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1m  Help[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows --force
+  [38;2;74;222;128m✓[0m help shows dry-run
+
+[1m  Dry-Run (Empty)[0m
+  [38;2;74;222;128m✓[0m dry-run shows Tmux Windows section
+  [38;2;74;222;128m✓[0m dry-run shows Team Configs section
+  [38;2;74;222;128m✓[0m dry-run shows Task Lists section
+  [38;2;74;222;128m✓[0m dry-run shows Pipeline Artifacts section
+  [38;2;74;222;128m✓[0m dry-run shows Pipeline State section
+  [38;2;74;222;128m✓[0m dry-run shows Heartbeats section
+  [38;2;74;222;128m✓[0m dry-run reports clean
+
+[1m  Force Mode (Empty)[0m
+  [38;2;74;222;128m✓[0m force shows FORCE MODE
+  [38;2;74;222;128m✓[0m force reports nothing to clean
+
+[1m  Detect Team Configs[0m
+  [38;2;74;222;128m✓[0m dry-run detects team dir
+  [38;2;74;222;128m✓[0m dry-run shows would remove
+
+[1m  Force Removes Teams[0m
+  [38;2;74;222;128m✓[0m force removes team dir
+  [38;2;74;222;128m✓[0m team directory actually removed
+
+[1m  Detect Task Lists[0m
+  [38;2;74;222;128m✓[0m dry-run detects task dir
+  [38;2;74;222;128m✓[0m task directory actually removed
+
+[1m  Detect Stale Heartbeats[0m
+  [38;2;74;222;128m✓[0m dry-run detects stale heartbeat
+
+[1m  Error Handling[0m
+  [38;2;74;222;128m✓[0m unknown option exits non-zero
+  [38;2;74;222;128m✓[0m unknown option shows error
+
+[1m  Summary Counting[0m
+  [38;2;74;222;128m✓[0m summary shows found count
+  [38;2;74;222;128m✓[0m summary shows --force hint
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 24 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Code Review Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;74;222;128m✓[0m help shows usage text
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m review runs and starts reviewing
+  [38;2;74;222;128m✓[0m trends with no data
+  [38;2;74;222;128m✓[0m config show outputs valid config
+  [38;2;74;222;128m✓[0m unknown subcommand exits nonzero
+  [38;2;74;222;128m✓[0m no false long function detection on small file
+  [38;2;74;222;128m✓[0m style consistency check runs without crash
+  [38;2;74;222;128m✓[0m architecture boundary check runs without crash
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
 
 
 [38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
@@ -560,24 +698,24 @@ All 16 tests passed!
 
 [2mSetting up test environment...[0m
 
-[38;2;124;58;237m[1mIdentity Resolution[0m
+[38;2;168;85;247m[1mIdentity Resolution[0m
   [38;2;0;212;255m▸[0m resolve_developer_id from DEVELOPER_ID env... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_developer_id from git config... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_developer_id fallback to USER... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_machine_name from MACHINE_NAME env... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_machine_name from hostname... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mDashboard URL Resolution[0m
+[38;2;168;85;247m[1mDashboard URL Resolution[0m
   [38;2;0;212;255m▸[0m resolve_dashboard_url from --url flag... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_dashboard_url from DASHBOARD_URL env... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_dashboard_url from team-config.json... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_dashboard_url falls back to default... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mStart/Stop Lifecycle[0m
+[38;2;168;85;247m[1mStart/Stop Lifecycle[0m
   [38;2;0;212;255m▸[0m cmd_start creates PID file... [38;2;0;212;255m[1m▸[0m Starting connect to [1mhttp://localhost:8767[0m
 [38;2;0;212;255m[1m▸[0m Developer: [1mtest-developer[0m @ [1mtest-machine[0m
-[38;2;74;222;128m[1m✓[0m Connect started (PID 1279947)
-  [2mLogs: /tmp/sw-connect-test.OESvLP/home/.shipwright/connect.log[0m
+[38;2;74;222;128m[1m✓[0m Connect started (PID 60906)
+  [2mLogs: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-connect-test.hVaiXc/home/.shipwright/connect.log[0m
   [2mStop: shipwright connect stop[0m
 [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m cmd_start rejects if already running...   [2mStop it first: shipwright connect stop[0m
@@ -587,29 +725,182 @@ All 16 tests passed!
   [38;2;0;212;255m▸[0m cmd_stop handles missing PID gracefully... [38;2;250;204;21m[1m⚠[0m Connect is not running (no PID file)
 [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mStatus[0m
+[38;2;168;85;247m[1mStatus[0m
   [38;2;0;212;255m▸[0m cmd_status shows connected when PID alive... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m cmd_status shows disconnected when no PID... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mJoin Flow[0m
+[38;2;168;85;247m[1mJoin Flow[0m
   [38;2;0;212;255m▸[0m cmd_join verifies token against dashboard... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m cmd_join saves team-config.json... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m cmd_join rejects invalid token... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m cmd_join accepts --url and --token flags... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mHeartbeat & Disconnect Payloads[0m
+[38;2;168;85;247m[1mHeartbeat & Disconnect Payloads[0m
   [38;2;0;212;255m▸[0m Heartbeat payload includes required fields... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m Send disconnect sends proper payload... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mConfiguration & Utilities[0m
+[38;2;168;85;247m[1mConfiguration & Utilities[0m
   [38;2;0;212;255m▸[0m ensure_dir creates shipwright directory... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m now_iso returns valid ISO timestamp... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m Script has correct version... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mIntegration[0m
+[38;2;168;85;247m[1mIntegration[0m
   [38;2;0;212;255m▸[0m Help command shows all main commands... [38;2;74;222;128m✓[0m
 
 [38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
 [38;2;74;222;128m[1m  All 25 tests passed ✓[0m
 [38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
 
+
+[38;2;0;212;255m[1m  Context Budget Monitor Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;0;212;255mBudget Initialization[0m
+  [38;2;74;222;128m✓[0m init creates config (exit 0)
+  [38;2;74;222;128m✓[0m config has correct total_budget
+  [38;2;74;222;128m✓[0m system_reserve is 10% (80000)
+  [38;2;74;222;128m✓[0m tools_reserve is 10% (80000)
+  [38;2;74;222;128m✓[0m working_memory is 60% (480000)
+  [38;2;74;222;128m✓[0m output_reserve is 20% (160000)
+
+  [38;2;0;212;255mToken Estimation[0m
+  [38;2;74;222;128m✓[0m estimation produces JSON
+  [38;2;74;222;128m✓[0m estimate contains utilization_percent
+  [38;2;74;222;128m✓[0m estimate contains total_used (>0)
+
+  [38;2;0;212;255mStatus Checking (Thresholds)[0m
+  [38;2;74;222;128m✓[0m 50% utilization returns green status
+  [38;2;74;222;128m✓[0m 70% utilization returns yellow status
+  [38;2;74;222;128m✓[0m 85% utilization returns red status
+  [38;2;74;222;128m✓[0m 95% utilization returns critical status
+
+  [38;2;0;212;255mContext Trimming[0m
+  [38;2;74;222;128m✓[0m green status doesn't trim content
+  [38;2;74;222;128m✓[0m yellow status reduces content length
+  [38;2;74;222;128m✓[0m hard truncate respects size limit
+
+  [38;2;0;212;255mIteration Summarization[0m
+  [38;2;74;222;128m✓[0m summarize_iteration succeeds (exit 0)
+  [38;2;74;222;128m✓[0m iteration summary file created with 1 entry
+
+  [38;2;0;212;255mBudget Report Generation[0m
+  [38;2;74;222;128m✓[0m report contains budget_config
+  [38;2;74;222;128m✓[0m report contains iteration_summaries
+
+  [38;2;0;212;255mState Logging[0m
+  [38;2;74;222;128m✓[0m log_state succeeds (exit 0)
+  [38;2;74;222;128m✓[0m log file created with entries
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 22 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Context Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;0;212;255mhelp command[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows commands
+  [38;2;74;222;128m✓[0m --help exits 0
+
+  [38;2;0;212;255merror handling[0m
+  [38;2;74;222;128m✓[0m unknown command exits 1
+  [38;2;74;222;128m✓[0m unknown command shows error
+
+  [38;2;0;212;255mshow subcommand[0m
+  [38;2;74;222;128m✓[0m show exits 0
+  [38;2;74;222;128m✓[0m show outputs context header
+
+  [38;2;0;212;255mclear subcommand[0m
+  [38;2;74;222;128m✓[0m clear exits 0
+  [38;2;74;222;128m✓[0m clear confirms cleared
+
+  [38;2;0;212;255mgather subcommand[0m
+  [38;2;74;222;128m✓[0m gather without args exits 1
+  [38;2;74;222;128m✓[0m gather shows must provide
+  [38;2;74;222;128m✓[0m gather with unknown option exits 1
+
+  [38;2;0;212;255mgather with goal[0m
+  [38;2;74;222;128m✓[0m gather exits 0
+  [38;2;74;222;128m✓[0m gather shows building
+  [38;2;74;222;128m✓[0m gather shows success
+  [38;2;74;222;128m✓[0m context-bundle.md created
+
+  [38;2;0;212;255mshow after gather[0m
+  [38;2;74;222;128m✓[0m show after gather exits 0
+  [38;2;74;222;128m✓[0m show contains pipeline context
+
+  [38;2;0;212;255mclear after gather[0m
+  [38;2;74;222;128m✓[0m clear exits 0
+
+  [38;2;0;212;255mgather with issue[0m
+  [38;2;74;222;128m✓[0m gather with --issue exits 0
+  [38;2;74;222;128m✓[0m gather shows building
+
+  [38;2;0;212;255mgather default stage[0m
+  [38;2;74;222;128m✓[0m gather default stage exits 0
+
+  [38;2;0;212;255minternal stage_guidance[0m
+  [38;2;74;222;128m✓[0m stage_guidance returns plan guidance
+  [38;2;74;222;128m✓[0m stage_guidance returns build guidance
+  [38;2;74;222;128m✓[0m stage_guidance handles unknown stage
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 26 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Cost Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[2m  help / version[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows USAGE
+  [38;2;74;222;128m✓[0m help shows COMMANDS
+  [38;2;74;222;128m✓[0m help mentions show
+  [38;2;74;222;128m✓[0m help mentions budget
+  [38;2;74;222;128m✓[0m help mentions calculate
+  [38;2;74;222;128m✓[0m VERSION variable defined
+
+[2m  state management[0m
+  [38;2;74;222;128m✓[0m costs.json created on first use
+  [38;2;74;222;128m✓[0m budget.json created on first use
+  [38;2;74;222;128m✓[0m costs.json has entries array
+  [38;2;74;222;128m✓[0m budget.json has daily_budget_usd
+
+[2m  budget commands[0m
+  [38;2;74;222;128m✓[0m budget set exits 0
+  [38;2;74;222;128m✓[0m budget set to 50
+  [38;2;74;222;128m✓[0m budget show exits 0
+
+[2m  error handling[0m
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
+
+[2m  calculate[0m
+  [38;2;74;222;128m✓[0m calculate exits 0
+
+[2m  script safety[0m
+  [38;2;74;222;128m✓[0m Uses set -euo pipefail
+  [38;2;74;222;128m✓[0m ERR trap is set
+
+[2m  context efficiency in cost dashboard[0m
+  [38;2;74;222;128m✓[0m Cost dashboard has CONTEXT EFFICIENCY section
+  [38;2;74;222;128m✓[0m Cost dashboard reads loop.context_efficiency events
+  [38;2;74;222;128m✓[0m Context efficiency reports utilization and waste
+  [38;2;248;113;113m✗[0m Dashboard renders CONTEXT EFFICIENCY with event data
+    [2moutput: ⚠ No cost entries in the last 30 day(s).[0m
+  [38;2;248;113;113m✗[0m Dashboard shows avg budget utilization
+ERROR: scripts/sw-cost-test.sh:226 exited with status 1
diff --git a/.claude/loop-logs/tests-iter-2.log b/.claude/loop-logs/tests-iter-2.log
index 176f067c3..0468dda2e 100644
--- a/.claude/loop-logs/tests-iter-2.log
+++ b/.claude/loop-logs/tests-iter-2.log
@@ -1,557 +1,695 @@
 
-> shipwright-cli@1.7.1 test
-> bash scripts/sw-pipeline-test.sh && bash scripts/sw-daemon-test.sh && bash scripts/sw-prep-test.sh && bash scripts/sw-fleet-test.sh && bash scripts/sw-fix-test.sh && bash scripts/sw-memory-test.sh && bash scripts/sw-session-test.sh && bash scripts/sw-init-test.sh && bash scripts/sw-tracker-test.sh && bash scripts/sw-heartbeat-test.sh && bash scripts/sw-remote-test.sh && bash scripts/sw-intelligence-test.sh && bash scripts/sw-pipeline-composer-test.sh && bash scripts/sw-self-optimize-test.sh && bash scripts/sw-predictive-test.sh && bash scripts/sw-frontier-test.sh && bash scripts/sw-connect-test.sh
+> shipwright-cli@3.2.4 test
+> bash scripts/sw-agi-roadmap-test.sh && bash scripts/sw-activity-test.sh && bash scripts/sw-adaptive-test.sh && bash scripts/sw-adversarial-test.sh && bash scripts/sw-architecture-enforcer-test.sh && bash scripts/sw-auth-test.sh && bash scripts/sw-autonomous-test.sh && bash scripts/sw-changelog-test.sh && bash scripts/sw-checkpoint-test.sh && bash scripts/sw-ci-test.sh && bash scripts/sw-cleanup-test.sh && bash scripts/sw-code-review-test.sh && bash scripts/sw-connect-test.sh && bash scripts/sw-context-budget-test.sh && bash scripts/sw-context-test.sh && bash scripts/sw-cost-test.sh && bash scripts/sw-daemon-test.sh && bash scripts/sw-dashboard-test.sh && bash scripts/sw-db-test.sh && bash scripts/sw-decompose-test.sh && bash scripts/sw-decide-test.sh && bash scripts/sw-deps-test.sh && bash scripts/sw-developer-simulation-test.sh && bash scripts/sw-discovery-test.sh && bash scripts/sw-doc-fleet-test.sh && bash scripts/sw-docs-agent-test.sh && bash scripts/sw-docs-test.sh && bash scripts/sw-doctor-test.sh && bash scripts/sw-dora-test.sh && bash scripts/sw-durable-test.sh && bash scripts/sw-e2e-orchestrator-test.sh && bash scripts/sw-eventbus-test.sh && bash scripts/sw-feedback-test.sh && bash scripts/sw-outcome-feedback-test.sh && bash scripts/sw-fix-test.sh && bash scripts/sw-fleet-discover-test.sh && bash scripts/sw-fleet-test.sh && bash scripts/sw-fleet-viz-test.sh && bash scripts/sw-frontier-test.sh && bash scripts/sw-github-app-test.sh && bash scripts/sw-github-checks-test.sh && bash scripts/sw-github-deploy-test.sh && bash scripts/sw-github-graphql-test.sh && bash scripts/sw-guild-test.sh && bash scripts/sw-heartbeat-test.sh && bash scripts/sw-hello-test.sh && bash scripts/sw-hygiene-test.sh && bash scripts/sw-incident-test.sh && bash scripts/sw-init-test.sh && bash scripts/sw-instrument-test.sh && bash scripts/sw-intelligence-test.sh && bash scripts/sw-jira-test.sh && bash scripts/sw-launchd-test.sh && bash scripts/sw-linear-test.sh && bash 
scripts/sw-logs-test.sh && bash scripts/sw-loop-test.sh && bash scripts/sw-memory-test.sh && bash scripts/sw-mission-control-test.sh && bash scripts/sw-model-router-test.sh && bash scripts/sw-otel-test.sh && bash scripts/sw-oversight-test.sh && bash scripts/sw-patrol-meta-test.sh && bash scripts/sw-pipeline-composer-test.sh && bash scripts/sw-pipeline-test.sh && bash scripts/sw-pipeline-vitals-test.sh && bash scripts/sw-pm-test.sh && bash scripts/sw-pr-lifecycle-test.sh && bash scripts/sw-predictive-test.sh && bash scripts/sw-prep-test.sh && bash scripts/sw-ps-test.sh && bash scripts/sw-public-dashboard-test.sh && bash scripts/sw-quality-profile-test.sh && bash scripts/sw-quality-test.sh && bash scripts/sw-reaper-test.sh && bash scripts/sw-recruit-test.sh && bash scripts/sw-regression-test.sh && bash scripts/sw-release-manager-test.sh && bash scripts/sw-release-test.sh && bash scripts/sw-root-cause-test.sh && bash scripts/sw-remote-test.sh && bash scripts/sw-replay-test.sh && bash scripts/sw-retro-test.sh && bash scripts/sw-scale-test.sh && bash scripts/sw-stall-detector-test.sh && bash scripts/sw-security-audit-test.sh && bash scripts/sw-self-optimize-test.sh && bash scripts/sw-session-test.sh && bash scripts/sw-setup-test.sh && bash scripts/sw-standup-test.sh && bash scripts/sw-status-test.sh && bash scripts/sw-strategic-test.sh && bash scripts/sw-stream-test.sh && bash scripts/sw-swarm-test.sh && bash scripts/sw-team-stages-test.sh && bash scripts/sw-templates-test.sh && bash scripts/sw-testgen-test.sh && bash scripts/sw-tmux-pipeline-test.sh && bash scripts/sw-tmux-test.sh && bash scripts/sw-trace-test.sh && bash scripts/sw-tracker-test.sh && bash scripts/sw-triage-test.sh && bash scripts/sw-upgrade-test.sh && bash scripts/sw-ux-test.sh && bash scripts/sw-webhook-test.sh && bash scripts/sw-widgets-test.sh && bash scripts/sw-worktree-test.sh && bash scripts/sw-lib-compat-test.sh && bash scripts/sw-lib-helpers-test.sh && bash 
scripts/sw-lib-error-actionability-test.sh && bash scripts/sw-lib-daemon-dispatch-test.sh && bash scripts/sw-lib-daemon-failure-test.sh && bash scripts/sw-lib-daemon-poll-test.sh && bash scripts/sw-lib-daemon-state-test.sh && bash scripts/sw-lib-daemon-triage-test.sh && bash scripts/sw-lib-daemon-patrol-test.sh && bash scripts/sw-lib-pipeline-detection-test.sh && bash scripts/sw-lib-pipeline-intelligence-test.sh && bash scripts/sw-lib-pipeline-quality-checks-test.sh && bash scripts/sw-lib-pipeline-stages-test.sh && bash scripts/sw-lib-pipeline-state-test.sh && bash scripts/sw-adapters-test.sh && bash scripts/sw-evidence-test.sh && bash scripts/sw-review-rerun-test.sh && bash scripts/sw-tracker-providers-test.sh && bash scripts/sw-budget-chaos-test.sh && bash scripts/sw-chaos-test.sh && bash scripts/sw-autonomous-e2e-test.sh && bash scripts/sw-memory-discovery-e2e-test.sh && bash scripts/sw-policy-e2e-test.sh && bash scripts/sw-e2e-smoke-test.sh && bash scripts/sw-dashboard-e2e-test.sh && bash scripts/sw-reward-aggregator-test.sh && bash scripts/sw-bandit-selector-test.sh && bash scripts/sw-policy-learner-test.sh && bash scripts/sw-autoresearch-e2e-test.sh
+
+
+[38;2;168;85;247m[1m╔════════════════════════════════════════════════════════════════╗[0m
+[38;2;168;85;247m[1m║  AGI-Roadmap Validation — Real Tests for Every Feature        ║[0m
+[38;2;168;85;247m[1m╚════════════════════════════════════════════════════════════════╝[0m
+
+[38;2;168;85;247m[1mPhase 1: Feedback Loops (Discovery, Memory, PM, Failure Learning)[0m
+  [38;2;0;212;255m▸[0m Daemon: failure_history initialized in state JSON... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: consecutive count uses reduce (run-from-newest, not total)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: get_max_retries_for_class returns per-class limits... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: exponential backoff formula 5*2^(n-3) is correct... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: resume_after parsed in UTC (not local TZ)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m PM: recommend --json flag implemented... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m PM: learn subcommand functional... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: PM recommend/learn wired into triage + success/failure... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: confidence < 60% upgrades to full template... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mPhase 2: Agent Coordination (Feedback, Predictive, Oversight, Autonomous)[0m
+  [38;2;0;212;255m▸[0m Feedback: ARTIFACTS_DIR respects caller override... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Feedback: rollback uses PIPESTATUS for correct exit code... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Predictive: anomaly detection returns severity for 5x baseline... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Predictive: inject-prevention command exists and runs... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: predictive anomaly/baseline/inject-prevention wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: memory metric wired into stage completion... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Oversight: gate approves clean review... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Oversight: gate rejects with --reject-if... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Oversight: gate JSON safe from newline/quote injection... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: oversight gate wired + respects SKIP_GATES... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: feedback collect/create-issue/rollback wired into monitor... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: intelligence prediction validation wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: predictive anomaly confirmation wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: memory fix-outcome negative path wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Triage: offline fallback with recruit... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Recruit: policy integration wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Recruit: meta feedback loop... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Recruit: audit (negative-compounding feedback)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Autonomous: safe recruit_args quoting... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Autonomous: Claude output redirected to findings file... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Autonomous: dual branch check (pipeline + daemon)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Autonomous: run_scheduler with loop/sleep... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Autonomous: trigger_pipeline_for_finding wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Incident: create_hotfix_issue echoes issue number... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Incident: trigger_pipeline wires --template hotfix... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Incident: trigger_rollback wires sw-feedback.sh... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mPhase 3: Quality Assurance (Code Review, Testgen, Swarm, Multi-Agent)[0m
+  [38;2;0;212;255m▸[0m Code review: run_claude_semantic_review exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Code review: semantic findings integrated... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Testgen: Claude prompt asks for real assertions... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Testgen: prompt piped to avoid shell expansion... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Swarm: spawn creates tmux session... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Swarm: retire kills tmux session... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Swarm: spawn/retire functional (real tmux)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Loop: multi-agent restarts not blocked... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mPhase 4: Meta-Cognition (Effectiveness, Self-Awareness, Capability)[0m
+  [38;2;0;212;255m▸[0m Pipeline: record_stage_effectiveness creates valid JSONL... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: self-awareness hint triggers on >50% failure rate... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: effectiveness recorded on both complete and failed... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: discovery inject wired... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: self-awareness hint injected into plan prompt... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mIntegration & Safety[0m
+  [38;2;0;212;255m▸[0m CI: integration-claude jobs in workflow... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Integration-claude: skip path functional... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m All modified scripts have strict mode... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m All modified scripts have ERR trap... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m No hardcoded secrets in scripts... [38;2;74;222;128m✓[0m
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 53 tests passed![0m
+
+
+[38;2;0;212;255m[1m  Shipwright Activity Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[1m  Script Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m Source guard pattern (if/then/fi)
+  [38;2;74;222;128m✓[0m VERSION variable defined
+
+[1m  Help Output[0m
+  [38;2;74;222;128m✓[0m help exits 0 and contains USAGE
+  [38;2;74;222;128m✓[0m help lists 'watch' subcommand
+  [38;2;74;222;128m✓[0m help lists 'snapshot' subcommand
+  [38;2;74;222;128m✓[0m help lists 'history' subcommand
+  [38;2;74;222;128m✓[0m help lists 'stats' subcommand
+  [38;2;74;222;128m✓[0m help lists 'agents' subcommand
+  [38;2;74;222;128m✓[0m --help alias works
+
+[1m  Error Handling[0m
+[38;2;0;212;255m[1mshipwright activity[0m — Live agent activity stream
+
+[1mUSAGE[0m
+  shipwright activity [subcommand] [options]
+
+[1mSUBCOMMANDS[0m
+  watch                      Live stream of agent activity (default)
+  snapshot                   Current state of all active agents
+  history [range]            Replay past activity (e.g., '1h', '10m', 'all')
+  stats                      Running counters (events, commits, tests, agents)
+  agents                     List known agents and last activity
+  help                       Show this help message
+
+[1mOPTIONS[0m
+  --type <type>              Filter events by type (e.g., 'stage.completed')
+  --agent <name>             Filter by agent name
+  --team <name>              Filter by team
+  --stage <name>             Filter by pipeline stage (e.g., 'build')
+
+[1mEXAMPLES[0m
+  \033[2mshipwright activity\033[0m                    # Live stream
+  \033[2mshipwright activity watch --type stage.*\033[0m  # Only stage events
+  \033[2mshipwright activity history 1h\033[0m           # Last hour
+  \033[2mshipwright activity snapshot\033[0m             # Current state
+  \033[2mshipwright activity stats\033[0m                # Counters
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
+
+[1m  Subcommands Without Events File[0m
+  [38;2;74;222;128m✓[0m snapshot exits non-zero with no events
+  [38;2;74;222;128m✓[0m stats exits non-zero with no events
+  [38;2;74;222;128m✓[0m agents exits non-zero with no events
+
+[1m  Event Emission[0m
+  [38;2;74;222;128m✓[0m emit_event creates events.jsonl
+  [38;2;74;222;128m✓[0m emit_event writes valid JSON
+  [38;2;74;222;128m✓[0m Event contains type field
+  [38;2;74;222;128m✓[0m Event contains agent field
+  [38;2;74;222;128m✓[0m Event contains numeric count
+
+[1m  Format Helpers[0m
+  [38;2;74;222;128m✓[0m get_icon_for_type commit returns icon
+  [38;2;74;222;128m✓[0m get_icon_for_type test.passed returns icon
+  [38;2;74;222;128m✓[0m get_icon_for_type unknown returns bullet
+  [38;2;74;222;128m✓[0m format_timestamp strips T and Z
+
+[1m  Stats With Events[0m
+  [38;2;74;222;128m✓[0m stats shows Total Events
+  [38;2;74;222;128m✓[0m stats shows Commits count
+  [38;2;74;222;128m✓[0m stats shows Pipelines count
 
+[1m  History Subcommand[0m
+  [38;2;74;222;128m✓[0m history all shows activity header
 
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright pipeline test — E2E Validation (Real Subprocess)     ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
 
-[2mSetting up mock environment...[0m
-[38;2;74;222;128m✓[0m Environment ready: [2m/tmp/sw-pipeline-test.76QxGO[0m
+[2m  ──────────────────────────────────────────[0m
 
-  [38;2;0;212;255m▸[0m Preflight passes with all mocks... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Preflight fails when sw-loop.sh missing... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Start requires --goal or --issue... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Intake with --goal creates branch + artifacts... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Intake with --issue fetches from GitHub... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Plan generates plan.md, dod.md, tasks... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Build invokes sw loop and commits... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Test stage captures results to log... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Review generates report with severities... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m PR stage creates PR URL artifact... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Full E2E pipeline (6 stages)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Resume continues from partial state... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Abort marks pipeline as aborted... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Dry run shows config, no artifacts... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Self-healing build→test retry loop... [38;2;74;222;128m✓[0m
+  [38;2;74;222;128m[1mAll 28 tests passed[0m
 
-[38;2;124;58;237m[1m━━━ Results ━━━[0m
-  [38;2;74;222;128mPassed:[0m 15
-  [38;2;248;113;113mFailed:[0m 0
-  [2mTotal:[0m  15
 
-[38;2;74;222;128m[1mAll 15 tests passed![0m
+[38;2;0;212;255m[1m  Shipwright Adaptive Tests[0m
+[2m  ══════════════════════════════════════════[0m
 
+[2m  help / version[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows USAGE
+  [38;2;74;222;128m✓[0m help shows SUBCOMMANDS
+  [38;2;74;222;128m✓[0m help mentions get
+  [38;2;74;222;128m✓[0m help mentions train
+  [38;2;74;222;128m✓[0m help mentions profile
+  [38;2;74;222;128m✓[0m version exits 0
+  [38;2;74;222;128m✓[0m version output contains version string
 
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright daemon test — Unit Tests (Synthetic Events)           ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
+[2m  error handling[0m
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
 
-[2mSetting up test environment...[0m
-[38;2;74;222;128m✓[0m Environment ready: [2m/tmp/sw-daemon-test.G3riH7[0m
+[2m  get command[0m
+  [38;2;74;222;128m✓[0m get timeout with default exits 0
 
-  [38;2;0;212;255m▸[0m dora_grade deploy_freq Elite (>= 7)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m dora_grade deploy_freq High (>= 1)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m dora_grade deploy_freq Medium (>= 0.25)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m dora_grade deploy_freq Low (< 0.25)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m dora_grade CFR thresholds (Elite/High/Medium/Low)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Stage timings filter-first jq query... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m MTTR pairs failures with next success... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m epoch_to_iso helper function... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Health check detects stale jobs... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Priority label sorting... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Degradation alert triggers on high CFR... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Metrics --json output with cycle_time keys... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Self-labeling includes watch_label when enabled... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Self-labeling excludes watch_label when disabled... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Patrol recurring failures label construction... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m DORA degradation event detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Retry exhaustion event detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Untested script detection logic... [38;2;74;222;128m✓[0m
+[2m  profile command[0m
+  [38;2;74;222;128m✓[0m profile exits 0
 
-[38;2;124;58;237m[1m━━━ Results ━━━[0m
-  [38;2;74;222;128mPassed:[0m 18
-  [38;2;248;113;113mFailed:[0m 0
-  [2mTotal:[0m  18
+[2m  reset command[0m
+  [38;2;74;222;128m✓[0m reset exits 0
 
-[38;2;74;222;128m[1mAll 18 tests passed![0m
+[2m  script safety[0m
+  [38;2;74;222;128m✓[0m Uses set -euo pipefail
+  [38;2;74;222;128m✓[0m Has source guard pattern
 
+[2m  statistical functions[0m
+  [38;2;74;222;128m✓[0m percentile, mean, median functions defined in source
+  [38;2;74;222;128m✓[0m mean returns numeric value (avg of 1-5 is 3)
 
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright prep test — Validation Suite (Real Subprocess)        ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
+[2m  get_timeout / get_iterations / get_model[0m
+  [38;2;74;222;128m✓[0m get_timeout returns number (default with no events)
+  [38;2;74;222;128m✓[0m get_iterations returns number
+  [38;2;74;222;128m✓[0m get_model returns valid model name
 
-[2mSetting up test environment...[0m
-[38;2;74;222;128m✓[0m Environment ready: [2m/tmp/sw-prep-test.3ZRNVS[0m
-
-  [38;2;0;212;255m▸[0m Node.js project detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Python project detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Go project detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Rust project detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m settings.json is valid JSON... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Hook scripts are executable... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Hook scripts have valid syntax... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m CLAUDE.md has required sections... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Check mode outputs scoring... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Idempotency without --force... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m --force overwrites modified files... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m No eval in generated hooks... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Definition of Done generated... [38;2;74;222;128m✓[0m
+[2m  train subcommand[0m
+  [38;2;74;222;128m✓[0m train subcommand runs with mock events
 
-[38;2;124;58;237m[1m━━━ Results ━━━[0m
-  [38;2;74;222;128mPassed:[0m 13
-  [38;2;248;113;113mFailed:[0m 0
-  [2mTotal:[0m  13
+[2m  ──────────────────────────────────────────[0m
 
-[38;2;74;222;128m[1mAll 13 tests passed![0m
+  [38;2;74;222;128m[1mAll 20 tests passed[0m
 
 
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright fleet test — Unit Tests                                ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
 
-[2mSetting up test environment...[0m
-[38;2;74;222;128m✓[0m Environment ready: [2m/tmp/sw-fleet-test.f4j7ea[0m
+[38;2;0;212;255m[1m  shipwright adversarial test[0m
+[2m  ══════════════════════════════════════════[0m
 
-  [38;2;0;212;255m▸[0m Help output contains expected sections... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Help via --help flag... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Config parsing — valid config... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Config parsing — missing config file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Config parsing — invalid JSON... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Config parsing — empty repos array... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Config defaults applied... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet init generates config template... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet init skips when config exists... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start spawns tmux sessions per repo... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start skips missing repos... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start skips existing sessions... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start creates fleet state file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start emits fleet.started event... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start applies repo-level overrides... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet stop kills sessions and cleans state... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet stop — no fleet running... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet stop emits fleet.stopped event... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet status — no fleet running... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet status shows dashboard... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet metrics — no events file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet metrics dashboard output... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet metrics JSON output... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet metrics period flag... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Session name generation... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fleet start skips non-git repos... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Unknown subcommand... [38;2;74;222;128m✓[0m
+[2m  ══════════════════════════════════════════[0m
 
-[38;2;124;58;237m[1m━━━ Results ━━━[0m
-  [38;2;74;222;128mPassed:[0m 27
-  [38;2;248;113;113mFailed:[0m 0
-  [2mTotal:[0m  27
+[1m  Script Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m Source guard pattern (if/then/fi)
+  [38;2;74;222;128m✓[0m VERSION variable defined
 
-[38;2;74;222;128m[1mAll 27 tests passed![0m
+[1m  Help Output[0m
+  [38;2;74;222;128m✓[0m help exits 0 and contains USAGE
+  [38;2;74;222;128m✓[0m help lists 'review' subcommand
+  [38;2;74;222;128m✓[0m help lists 'iterate' subcommand
+  [38;2;74;222;128m✓[0m help mentions adversarial_enabled flag
+  [38;2;74;222;128m✓[0m --help alias works
+  [38;2;74;222;128m✓[0m -h alias works
 
+[1m  Error Handling[0m
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
 
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright fix test — Unit Tests                                  ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
+[1m  Review Subcommand[0m
+  [38;2;74;222;128m✓[0m review disabled returns empty JSON array
+  [38;2;74;222;128m✓[0m review without diff arg exits non-zero
 
-[2mSetting up test environment...[0m
-[38;2;74;222;128m✓[0m Environment ready: [2m/tmp/sw-fix-test.XuOv7c[0m
+[1m  Iterate Subcommand[0m
+  [38;2;74;222;128m✓[0m iterate without args exits non-zero
+  [38;2;74;222;128m✓[0m iterate with empty findings converges
+  [38;2;74;222;128m✓[0m iterate past max rounds returns findings
 
-  [38;2;0;212;255m▸[0m Help output contains expected sections... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Help via --help flag... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Missing goal shows error... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Missing repos shows error... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Arg parsing — --repos comma-separated... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Arg parsing — --repos-from file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Arg parsing — --repos-from missing file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Arg parsing — --pipeline template... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Arg parsing — --max-parallel... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Arg parsing — --branch-prefix... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Dry run shows what would happen... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Dry run does not create state file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fix status — no sessions... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fix status shows existing sessions... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Invalid repo directory shows error... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fix start creates state file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fix start emits events... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fix start — summary output... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Branch name sanitization... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fix header shows configuration... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Non-git repo warning... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Per-repo event tracking... [38;2;74;222;128m✓[0m
+[1m  Configuration[0m
+  [38;2;74;222;128m✓[0m ADVERSARIAL_MAX_ROUNDS env var respected
+  [38;2;74;222;128m✓[0m disabled config returns empty array
 
-[38;2;124;58;237m[1m━━━ Results ━━━[0m
-  [38;2;74;222;128mPassed:[0m 22
-  [38;2;248;113;113mFailed:[0m 0
-  [2mTotal:[0m  22
+[1m  Event Emission[0m
+  [38;2;74;222;128m✓[0m emit_event creates events.jsonl
+  [38;2;74;222;128m✓[0m emit_event writes valid JSON
+  [38;2;74;222;128m✓[0m Event contains type field
 
-[38;2;74;222;128m[1mAll 22 tests passed![0m
 
 
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright memory+cost test — Unit Tests for Memory & Cost      ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
 
-[2mSetting up mock environment...[0m
-[38;2;74;222;128m✓[0m Environment ready: [2m/tmp/sw-memory-test.yiF1Rw[0m
+[2m  ──────────────────────────────────────────[0m
 
-  [38;2;0;212;255m▸[0m Memory capture from pipeline state... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Memory inject returns context for each stage... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Failure capture stores patterns... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Pattern detection identifies project type... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Cross-repo vs per-repo isolation... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Memory show displays dashboard... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Memory search finds matching entries... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Memory export produces valid JSON... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Memory forget clears repo memory... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Cost calculation for each model... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Cost recording writes to costs.json... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Budget set and check... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Cost dashboard runs without errors... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Cost JSON output is valid... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Actionable failures threshold filtering... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Actionable failures with no file returns []... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m DORA baseline calculation from events... [38;2;74;222;128m✓[0m
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
 
-[38;2;124;58;237m[1m━━━ Results ━━━[0m
-  [38;2;74;222;128mPassed:[0m 17
-  [38;2;248;113;113mFailed:[0m 0
-  [2mTotal:[0m  17
 
-[38;2;74;222;128m[1mAll 17 tests passed![0m
 
+[38;2;0;212;255m[1m  shipwright architecture-enforcer test[0m
+[2m  ══════════════════════════════════════════[0m
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright session — E2E Test Suite              ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+[2m  ══════════════════════════════════════════[0m
 
-[2mSetting up test environment...[0m
-[2mTest tmux session: sw-test-1303977[0m
-
-[38;2;124;58;237m[1mTemplate Loading[0m
-  [38;2;0;212;255m▸[0m Load feature-dev template (3 agents)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Load exploration template (2 agents)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Missing template returns error... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m All 24 templates load successfully... [38;2;74;222;128m✓[0m
-
-[38;2;124;58;237m[1mWindow Creation[0m
-  [38;2;0;212;255m▸[0m No-launch creates window without claude... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Duplicate window detection... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Window gets dark theme... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Auto-generated team name... [38;2;74;222;128m✓[0m
-
-[38;2;124;58;237m[1mPrompt & Launcher[0m
-  [38;2;0;212;255m▸[0m Launcher script generation with template... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Output includes agents from template... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Output includes goal when provided... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m No template + goal works... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m No template + no goal = interactive... [38;2;74;222;128m✓[0m
-
-[38;2;124;58;237m[1mCLI & Configuration[0m
-  [38;2;0;212;255m▸[0m Help flag... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Unknown option... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m TMPDIR used for launcher files... [38;2;74;222;128m✓[0m
+[1m  Script Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m Source guard pattern (if/then/fi)
+  [38;2;74;222;128m✓[0m VERSION variable defined
 
-[38;2;124;58;237m[1mEnhanced Features[0m
-  [38;2;0;212;255m▸[0m Template auto-suggestion from goal... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m No suggestion without goal... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Memory injection in prompt... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m CLAUDE.md reminder in prompt... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Secure temp dir in source... [38;2;74;222;128m✓[0m
+[1m  Help Output[0m
+  [38;2;74;222;128m✓[0m help exits 0 and contains USAGE
+  [38;2;74;222;128m✓[0m help lists 'build' subcommand
+  [38;2;74;222;128m✓[0m help lists 'validate' subcommand
+  [38;2;74;222;128m✓[0m help lists 'evolve' subcommand
+  [38;2;74;222;128m✓[0m help mentions architecture_enabled flag
+  [38;2;74;222;128m✓[0m --help alias works
+  [38;2;74;222;128m✓[0m -h alias works
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 21 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[1m  Error Handling[0m
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
 
+[1m  Build Subcommand[0m
+  [38;2;74;222;128m✓[0m build disabled returns empty JSON object
+  [38;2;74;222;128m✓[0m build with enabled returns model with layers
+  [38;2;74;222;128m✓[0m build model contains patterns array
+  [38;2;74;222;128m✓[0m build model contains conventions array
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright init — E2E Test Suite                 ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+[1m  Validate Subcommand[0m
+  [38;2;74;222;128m✓[0m validate disabled returns empty array
+  [38;2;74;222;128m✓[0m validate without diff arg exits non-zero
+  [38;2;74;222;128m✓[0m validate without model file returns empty array
 
-[2mSetting up sandboxed environment...[0m
-[2mTemp dir: /tmp/sw-init-test.JhXYsO[0m
+[1m  Evolve Subcommand[0m
+  [38;2;74;222;128m✓[0m evolve disabled exits 0
+  [38;2;74;222;128m✓[0m evolve without model exits 0
 
-[38;2;124;58;237m[1mConfiguration[0m
-  [38;2;0;212;255m▸[0m Settings.json created with agent teams... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Settings merge preserves existing vars... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m tmux.conf installed... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Overlay installed... [38;2;74;222;128m✓[0m
+[1m  Model Storage[0m
+  [38;2;74;222;128m✓[0m build stores model in ~/.shipwright/memory/
+  [38;2;74;222;128m✓[0m Stored model is valid JSON
 
-[38;2;124;58;237m[1mTemplates[0m
-  [38;2;0;212;255m▸[0m Team templates installed (>= 10)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Pipeline templates installed (>= 5)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Legacy templates path populated... [38;2;74;222;128m✓[0m
+[1m  Event Emission[0m
+  [38;2;74;222;128m✓[0m emit_event creates events.jsonl
+  [38;2;74;222;128m✓[0m emit_event writes valid JSON
+  [38;2;74;222;128m✓[0m Event contains type field
 
-[38;2;124;58;237m[1mRobustness[0m
-  [38;2;0;212;255m▸[0m Idempotency — double init safe... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Doctor runs at end... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Help flag... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mHook Wiring[0m
-  [38;2;0;212;255m▸[0m JSONC stripped from settings.json... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Hooks wired into settings.json... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Hook wiring preserves existing hooks... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m SessionStart hook installed... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Hook wiring with pre-existing settings... [38;2;74;222;128m✓[0m
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 15 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
 
+[2m  ──────────────────────────────────────────[0m
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright tracker — Test Suite                  ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
 
-[2mSetting up test environment...[0m
 
-[38;2;124;58;237m[1mProvider Loading[0m
-  [38;2;0;212;255m▸[0m Provider loads from config (linear)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Provider loads jira... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Graceful skip when no provider... [38;2;74;222;128m✓[0m
+[38;2;0;212;255m[1m  Shipwright Auth Tests[0m
+[2m  ══════════════════════════════════════════[0m
 
-[38;2;124;58;237m[1mPipeline Enrichment[0m
-  [38;2;0;212;255m▸[0m Stage descriptions exist for all 12 stages... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Enriched progress body has Delivering line... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Enriched progress body has stage descriptions... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Pipeline state includes stage_progress... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Pipeline state includes stage description... [38;2;74;222;128m✓[0m
+[1m  Help[0m
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows commands
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m unknown command shows error
+[1m  Status & Users[0m
+  [38;2;74;222;128m✓[0m status with no login shows warning
+  [38;2;74;222;128m✓[0m users with empty shows warning
+  [38;2;74;222;128m✓[0m token with no user errors
+  [38;2;74;222;128m✓[0m switch without user exits non-zero
+[1m  Auth Storage[0m
+  [38;2;74;222;128m✓[0m auth file has users array
+  [38;2;74;222;128m✓[0m auth file has active_user
+  [38;2;74;222;128m✓[0m users lists stored user
+  [38;2;74;222;128m✓[0m token shows stored token
+  [38;2;74;222;128m✓[0m user info shows login
+  [38;2;74;222;128m✓[0m switch to nonexistent errors
+  [38;2;74;222;128m✓[0m logout succeeds
 
-[38;2;124;58;237m[1mIntegration[0m
-  [38;2;0;212;255m▸[0m Tracker notify routes to provider (mock)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Dashboard reads goal from pipeline state... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Jira config validation... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Linear config migration (legacy fallback)... [38;2;74;222;128m✓[0m
+[2m  ──────────────────────────────────────────[0m
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 12 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+  [38;2;74;222;128m[1mAll 15 tests passed[0m
 
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright heartbeat + checkpoint — Test Suite   ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
 
-[2mSetting up test environment...[0m
+[38;2;0;212;255m[1m  Shipwright Autonomous Tests[0m
+[2m  ══════════════════════════════════════════[0m
 
-[38;2;124;58;237m[1mHeartbeat Lifecycle[0m
-  [38;2;0;212;255m▸[0m Write heartbeat creates JSON file... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Check heartbeat reports alive... [38;2;74;222;128m[1m✓[0m Job test-job-alive alive (0s ago)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Check heartbeat reports stale... [38;2;250;204;21m[1m⚠[0m Job test-job-stale stale (192940640s ago, timeout: 120s)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Clear heartbeat removes file... [38;2;74;222;128m[1m✓[0m Cleared heartbeat for job: test-job-clear
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m List heartbeats returns JSON array... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Heartbeat update overwrites existing... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Check missing heartbeat returns error... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Heartbeat dir auto-created when missing... [38;2;74;222;128m✓[0m
+[2m  ══════════════════════════════════════════[0m
 
-[38;2;124;58;237m[1mCheckpoint Lifecycle[0m
-  [38;2;0;212;255m▸[0m Checkpoint save creates JSON file... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 5)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Checkpoint restore outputs JSON... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mtest[0m (iteration 3)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Checkpoint restore missing stage fails... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Checkpoint clear removes file... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mreview[0m (iteration 1)
-[38;2;74;222;128m[1m✓[0m Cleared checkpoint for stage [1mreview[0m
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Checkpoint clear --all removes all... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 1)
-[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mtest[0m (iteration 2)
-[38;2;74;222;128m[1m✓[0m Cleared 2 checkpoint(s)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Checkpoint save with files-modified... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 7)
-[38;2;74;222;128m✓[0m
+  [38;2;74;222;128m✓[0m help shows usage text
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m unknown command exits 1
+  [38;2;74;222;128m✓[0m start shows running message
+  [38;2;74;222;128m✓[0m state.json created after start
+  [38;2;74;222;128m✓[0m state status is running
+  [38;2;74;222;128m✓[0m config.json created
+  [38;2;74;222;128m✓[0m config is valid JSON
+  [38;2;74;222;128m✓[0m status shows dashboard
+  [38;2;74;222;128m✓[0m pause sets status to paused
+  [38;2;74;222;128m✓[0m resume sets status to running
+  [38;2;74;222;128m✓[0m stop sets status to stopped
+  [38;2;74;222;128m✓[0m config show displays settings
+  [38;2;74;222;128m✓[0m config set interval works
+  [38;2;74;222;128m✓[0m history handles no data
 
-[38;2;124;58;237m[1mIntegration[0m
-  [38;2;0;212;255m▸[0m Pipeline script has heartbeat functions... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Loop script has heartbeat and checkpoint... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Pipeline has human intervention checks... [38;2;74;222;128m✓[0m
+[1m  Config Set/Show Cycle[0m
+  [38;2;74;222;128m✓[0m config show reflects set value
+  [38;2;74;222;128m✓[0m config value persists in file
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 17 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[1m  Config Structure[0m
+  [38;2;74;222;128m✓[0m config contains key: cycle_interval_minutes
+  [38;2;74;222;128m✓[0m config contains key: max_issues_per_cycle
+  [38;2;74;222;128m✓[0m config contains key: daemon_aware
 
+[1m  History With Fixture Events[0m
+  [38;2;74;222;128m✓[0m history shows recent cycles
+  [38;2;74;222;128m✓[0m history shows cycle entries
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright remote — Test Suite                   ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+[1m  Status Fields[0m
+  [38;2;74;222;128m✓[0m status when running includes Status
+  [38;2;74;222;128m✓[0m status when running includes Cycles
+  [38;2;74;222;128m✓[0m status when running includes Issues Created
+  [38;2;74;222;128m✓[0m status when running includes Pipelines
+  [38;2;74;222;128m✓[0m status when running includes Cycle Interval
+  [38;2;74;222;128m✓[0m status when running shows running
+  [38;2;74;222;128m✓[0m status when stopped shows stopped
 
-[2mSetting up test environment...[0m
 
-[38;2;124;58;237m[1mMachine Registry[0m
-  [38;2;0;212;255m▸[0m Add machine creates machines.json... [38;2;0;212;255m[1m▸[0m Checking shipwright installation at [2m/tmp/sw-remote-test.Qm0tkC/mock-install[0m...
-[38;2;74;222;128m[1m✓[0m Shipwright found at /tmp/sw-remote-test.Qm0tkC/mock-install
-[38;2;74;222;128m[1m✓[0m Registered machine: [1mbuilder-1[0m (localhost, worker, 4 workers)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Add second machine appends to array... [38;2;0;212;255m[1m▸[0m Checking shipwright installation at [2m/tmp/sw-remote-test.Qm0tkC/mock-install[0m...
-[38;2;74;222;128m[1m✓[0m Shipwright found at /tmp/sw-remote-test.Qm0tkC/mock-install
-[38;2;74;222;128m[1m✓[0m Registered machine: [1mbuilder-2[0m (localhost, worker, 8 workers)
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Remove machine by name... [38;2;74;222;128m[1m✓[0m Removed machine: [1mbuilder-2[0m
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m List machines returns output... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m machines.json uses atomic writes... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Duplicate machine name prevented... [38;2;0;212;255m[1m▸[0m Use [38;2;0;212;255mshipwright remote remove builder-1[0m first
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Remote script has help command... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mCLI & Dashboard Integration[0m
-  [38;2;0;212;255m▸[0m CLI router includes remote command... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m CLI router includes heartbeat command... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m CLI router includes checkpoint command... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Doctor has heartbeat health check... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Doctor has remote machine checks... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Status shows heartbeat section... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Status shows remote machines section... [38;2;74;222;128m✓[0m
+[2m  ──────────────────────────────────────────[0m
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 14 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
 
 
-[38;2;124;58;237m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
-[38;2;124;58;237m[1m║  shipwright intelligence test — Unit Tests                       ║[0m
-[38;2;124;58;237m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
 
-[2mSetting up test environment...[0m
-✓ Environment ready: /tmp/sw-intelligence-test.aRDezI
+[38;2;0;212;255m[1m  Shipwright Changelog Tests[0m
+[2m  ══════════════════════════════════════════[0m
 
-  ▸ analyze_issue returns valid schema... ✓
-  ▸ Cache hit on second call with same input... ✓
-  ▸ Graceful degradation when claude CLI unavailable... ✓
-  ▸ compose_pipeline produces valid pipeline JSON... ✓
-  ▸ recommend_model returns valid model names... ✓
-  ▸ predict_cost returns numeric estimates... ✓
-  ▸ Cache TTL expiry returns miss... ✓
-  ▸ search_memory returns ranked results... ✓
-  ▸ Feature flag disabled returns fallback... ✓
-  ▸ Events emitted for analysis... ✓
-  ▸ recommend_model emits events... ✓
-  ▸ Cache init creates file if missing... ✓
+[2m  ══════════════════════════════════════════[0m
 
-━━━ Results ━━━
-  Passed: 12
-  Failed: 0
-  Total:  12
+[2m  help / version[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows USAGE
+  [38;2;74;222;128m✓[0m help mentions generate
+  [38;2;74;222;128m✓[0m help mentions preview
+  [38;2;74;222;128m✓[0m help mentions version
+  [38;2;74;222;128m✓[0m help mentions migrate
+  [38;2;74;222;128m✓[0m VERSION variable defined
 
-All 12 tests passed!
+[2m  error handling[0m
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
 
+[2m  formats command[0m
+  [38;2;74;222;128m✓[0m formats exits 0
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright pipeline composer — Test Suite        ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+[2m  generate command[0m
+  [38;2;74;222;128m✓[0m generate exits 0
 
-[2mSetting up test environment...[0m
+[2m  version command[0m
+  [38;2;74;222;128m✓[0m version recommendation exits 0
 
-[38;2;124;58;237m[1mPipeline Composition[0m
-  [38;2;0;212;255m▸[0m Composed pipeline has valid stage ordering... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m High-risk issue gets security stages... [38;2;0;212;255m[1m▸[0m Composing pipeline with intelligence engine...
-[38;2;74;222;128m[1m✓[0m Composed pipeline: 7 stages
-.claude/pipeline-artifacts/composed-pipeline.json
-[38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Fallback to static template when no intelligence... [38;2;74;222;128m✓[0m
+[2m  script safety[0m
+  [38;2;74;222;128m✓[0m Uses set -euo pipefail
+  [38;2;74;222;128m✓[0m Has source guard pattern
 
-[38;2;124;58;237m[1mConditional Stage Insertion[0m
-  [38;2;0;212;255m▸[0m Stage inserted at correct position after build... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Insert into nonexistent stage fails... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mModel Downgrade[0m
-  [38;2;0;212;255m▸[0m Budget constraint triggers model downgrades... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Downgrade with nonexistent stage fails... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mPipeline Validation[0m
-  [38;2;0;212;255m▸[0m Validation accepts valid pipeline... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Validation rejects invalid ordering (test before build)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Validation rejects missing stage ids... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Validation rejects missing stages array... [38;2;74;222;128m✓[0m
+[2m  ──────────────────────────────────────────[0m
 
-[38;2;124;58;237m[1mIteration Estimation[0m
-  [38;2;0;212;255m▸[0m Iteration estimates are reasonable (1-50 range)... [38;2;74;222;128m✓[0m
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 12 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
 
 
-[38;2;124;58;237m[1m━━━ shipwright self-optimize tests ━━━[0m
+[38;2;0;212;255m[1m  shipwright checkpoint test[0m
+[2m  ══════════════════════════════════════════[0m
 
-  ▸ Outcome analysis extracts correct metrics... ✓
-  ▸ Outcome analysis emits event... ✓
-  ▸ Outcome analysis rejects missing file... ✓
-  ▸ Template weight increases for high success... ✓
-  ▸ Template weight decreases for low success... ✓
-  ▸ A/B test selects ~20% sample... ✓
-  ▸ Iteration model updates with data points... ✓
-  ▸ Model routing tracks success rates... ✓
-  ▸ Model routing keeps opus with few sonnet samples... ✓
-  ▸ Memory pruning removes old patterns... ✓
-  ▸ Memory strengthening boosts confirmed patterns... ✓
-  ▸ Memory promotion copies cross-repo patterns... ✓
-  ▸ Full analysis runs on empty data... ✓
-  ▸ Report generates output with data... ✓
-  ▸ Report handles empty outcomes... ✓
-  ▸ Outcome analysis extracts stage data... ✓
+[2m  ══════════════════════════════════════════[0m
 
-━━━ Results ━━━
-  Passed: 16
-  Failed: 0
-  Total:  16
+[1m  Script Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m VERSION variable defined
+
+[1m  Help Output[0m
+  [38;2;74;222;128m✓[0m help exits 0 and contains USAGE
+  [38;2;74;222;128m✓[0m help lists 'save' subcommand
+  [38;2;74;222;128m✓[0m help lists 'restore' subcommand
+  [38;2;74;222;128m✓[0m help lists 'list' subcommand
+  [38;2;74;222;128m✓[0m help lists 'clear' subcommand
+  [38;2;74;222;128m✓[0m help lists 'expire' subcommand
+  [38;2;74;222;128m✓[0m --help alias works
+  [38;2;74;222;128m✓[0m -h alias works
+
+[1m  Error Handling[0m
+
+[38;2;0;212;255m[1mshipwright checkpoint[0m [2mv3.2.4[0m — Save and restore agent state mid-stage
+
+[1mUSAGE[0m
+  [38;2;0;212;255mshipwright checkpoint[0m <command> [options]
+
+[1mCOMMANDS[0m
+  [38;2;0;212;255msave[0m           Save a checkpoint for a stage
+  [38;2;0;212;255mrestore[0m        Restore a checkpoint (prints JSON to stdout)
+  [38;2;0;212;255msave-context[0m   Save Claude context (goal, findings, test output) for resume
+  [38;2;0;212;255mrestore-context[0m Restore Claude context (exports RESTORED_* and SW_LOOP_* vars)
+  [38;2;0;212;255mlist[0m      Show all available checkpoints
+  [38;2;0;212;255mclear[0m     Remove checkpoint(s)
+  [38;2;0;212;255mexpire[0m    Remove checkpoints older than N hours
+
+[1mSAVE OPTIONS[0m
+  [38;2;0;212;255m--stage[0m <name>              Stage name (required)
+  [38;2;0;212;255m--iteration[0m <n>             Current iteration number
+  [38;2;0;212;255m--git-sha[0m <sha>             Git commit SHA (default: HEAD)
+  [38;2;0;212;255m--files-modified[0m "f1,f2"    Comma-separated list of modified files
+  [38;2;0;212;255m--tests-passing[0m             Mark tests as passing
+  [38;2;0;212;255m--loop-state[0m <state>        Loop state (running, paused, etc.)
+
+[1mRESTORE OPTIONS[0m
+  [38;2;0;212;255m--stage[0m <name>              Stage to restore (required)
+
+[1mCLEAR OPTIONS[0m
+  [38;2;0;212;255m--stage[0m <name>              Stage to clear
+  [38;2;0;212;255m--all[0m                       Clear all checkpoints
+
+[1mEXPIRE OPTIONS[0m
+  [38;2;0;212;255m--hours[0m <n>                 Max age in hours (default: 24)
 
-All 16 tests passed!
+[1mEXAMPLES[0m
+  [2mshipwright checkpoint save --stage build --iteration 5[0m
+  [2mshipwright checkpoint save --stage build --iteration 3 --tests-passing --files-modified "src/auth.ts,src/middleware.ts"[0m
+  [2mshipwright checkpoint restore --stage build[0m
+  [2mshipwright checkpoint list[0m
+  [2mshipwright checkpoint clear --stage build[0m
+  [2mshipwright checkpoint clear --all[0m
+  [2mshipwright checkpoint expire --hours 48[0m
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
+
+[1m  Save Subcommand[0m
+
+[38;2;0;212;255m[1mshipwright checkpoint[0m [2mv3.2.4[0m — Save and restore agent state mid-stage
+
+[1mUSAGE[0m
+  [38;2;0;212;255mshipwright checkpoint[0m <command> [options]
+
+[1mCOMMANDS[0m
+  [38;2;0;212;255msave[0m           Save a checkpoint for a stage
+  [38;2;0;212;255mrestore[0m        Restore a checkpoint (prints JSON to stdout)
+  [38;2;0;212;255msave-context[0m   Save Claude context (goal, findings, test output) for resume
+  [38;2;0;212;255mrestore-context[0m Restore Claude context (exports RESTORED_* and SW_LOOP_* vars)
+  [38;2;0;212;255mlist[0m      Show all available checkpoints
+  [38;2;0;212;255mclear[0m     Remove checkpoint(s)
+  [38;2;0;212;255mexpire[0m    Remove checkpoints older than N hours
+
+[1mSAVE OPTIONS[0m
+  [38;2;0;212;255m--stage[0m <name>              Stage name (required)
+  [38;2;0;212;255m--iteration[0m <n>             Current iteration number
+  [38;2;0;212;255m--git-sha[0m <sha>             Git commit SHA (default: HEAD)
+  [38;2;0;212;255m--files-modified[0m "f1,f2"    Comma-separated list of modified files
+  [38;2;0;212;255m--tests-passing[0m             Mark tests as passing
+  [38;2;0;212;255m--loop-state[0m <state>        Loop state (running, paused, etc.)
+
+[1mRESTORE OPTIONS[0m
+  [38;2;0;212;255m--stage[0m <name>              Stage to restore (required)
+
+[1mCLEAR OPTIONS[0m
+  [38;2;0;212;255m--stage[0m <name>              Stage to clear
+  [38;2;0;212;255m--all[0m                       Clear all checkpoints
+
+[1mEXPIRE OPTIONS[0m
+  [38;2;0;212;255m--hours[0m <n>                 Max age in hours (default: 24)
+
+[1mEXAMPLES[0m
+  [2mshipwright checkpoint save --stage build --iteration 5[0m
+  [2mshipwright checkpoint save --stage build --iteration 3 --tests-passing --files-modified "src/auth.ts,src/middleware.ts"[0m
+  [2mshipwright checkpoint restore --stage build[0m
+  [2mshipwright checkpoint list[0m
+  [2mshipwright checkpoint clear --stage build[0m
+  [2mshipwright checkpoint clear --all[0m
+  [2mshipwright checkpoint expire --hours 48[0m
+  [38;2;74;222;128m✓[0m save without --stage exits non-zero
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 5)
+  [38;2;74;222;128m✓[0m save creates checkpoint file
+  [38;2;74;222;128m✓[0m Checkpoint is valid JSON
+  [38;2;74;222;128m✓[0m Checkpoint stage field correct
+  [38;2;74;222;128m✓[0m Checkpoint iteration field correct
+  [38;2;74;222;128m✓[0m Checkpoint git_sha populated
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mtest[0m (iteration 0)
+  [38;2;74;222;128m✓[0m save --tests-passing sets true
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mreview[0m (iteration 0)
+  [38;2;74;222;128m✓[0m save --files-modified stores 2 files
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mdeploy[0m (iteration 0)
+  [38;2;74;222;128m✓[0m save --loop-state stores state
+  [38;2;74;222;128m✓[0m Checkpoint created_at timestamp present
+
+[1m  Restore Subcommand[0m
+  [38;2;74;222;128m✓[0m restore returns checkpoint JSON
+  [38;2;74;222;128m✓[0m Restored checkpoint has correct stage
+  [38;2;74;222;128m✓[0m restore missing stage exits non-zero
+  [38;2;74;222;128m✓[0m restore without --stage exits non-zero
+
+[1m  List Subcommand[0m
+  [38;2;74;222;128m✓[0m list shows Checkpoints header
+  [38;2;74;222;128m✓[0m list shows build checkpoint
+  [38;2;74;222;128m✓[0m list shows checkpoint count
+  [38;2;74;222;128m✓[0m list with no checkpoints shows empty
+
+[1m  Clear Subcommand[0m
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 1)
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mtest[0m (iteration 2)
+[38;2;74;222;128m[1m✓[0m Cleared checkpoint for stage [1mbuild[0m
+  [38;2;74;222;128m✓[0m clear --stage removes specific checkpoint
+  [38;2;74;222;128m✓[0m clear --stage preserves other checkpoints
+  [38;2;74;222;128m✓[0m clear without args exits non-zero
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 3)
+[38;2;74;222;128m[1m✓[0m Cleared 2 checkpoint(s)
+  [38;2;74;222;128m✓[0m clear --all removes all checkpoints
 
+[1m  Expire Subcommand[0m
+  [38;2;74;222;128m✓[0m expire with no checkpoints exits 0
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright predictive test                              ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════════════╝[0m
+[1m  Save-context / Restore-context[0m
+  [38;2;74;222;128m✓[0m save-context creates claude-context.json
+  [38;2;74;222;128m✓[0m Context goal saved correctly
+  [38;2;74;222;128m✓[0m Context iteration saved correctly
+  [38;2;74;222;128m✓[0m restore-context exports RESTORED_GOAL
+  [38;2;74;222;128m✓[0m restore-context exports SW_LOOP_GOAL
 
 
-[38;2;124;58;237m[1mRisk Assessment[0m
-  [38;2;0;212;255m▸[0m Risk returns valid schema with 0-100 range... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Risk elevates for complex keywords... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Risk emits event... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mAnomaly Detection[0m
-  [38;2;0;212;255m▸[0m Critical at 3x threshold (181 vs 60 baseline)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Normal at 2x (119 vs 60 baseline)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Warning between 2x and 3x (150 vs 60)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Normal when no baseline exists... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Emits event for critical anomaly... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mBaseline Management[0m
-  [38;2;0;212;255m▸[0m First data point uses raw value... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m EMA calculation (0.9*100 + 0.1*200 = 110)... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Creates baseline file if missing... [38;2;74;222;128m✓[0m
+[2m  ──────────────────────────────────────────[0m
 
-[38;2;124;58;237m[1mPreventative Injection[0m
-  [38;2;0;212;255m▸[0m Injects context from matching patterns... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Returns empty for non-matching stage... [38;2;74;222;128m✓[0m
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
 
-[38;2;124;58;237m[1mGraceful Degradation[0m
-  [38;2;0;212;255m▸[0m Works without intelligence engine... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mAI Patrol[0m
-  [38;2;0;212;255m▸[0m AI patrol returns structured findings... [38;2;74;222;128m✓[0m
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 15 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[38;2;0;212;255m[1m  Shipwright CI Tests[0m
+[2m  ══════════════════════════════════════════[0m
 
+[2m  ══════════════════════════════════════════[0m
 
-[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
-[38;2;0;212;255m[1m║  shipwright frontier — Test Suite                 ║[0m
-[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+  [38;2;74;222;128m✓[0m help shows usage text
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m version shows version
+  [38;2;74;222;128m✓[0m unknown command exits 1
+  [38;2;74;222;128m✓[0m generate starts processing
+  [38;2;74;222;128m✓[0m validate runs on valid workflow
+  [38;2;74;222;128m✓[0m VERSION is defined
+  [38;2;74;222;128m✓[0m analyze shows analysis
+  [38;2;74;222;128m✓[0m analyze shows cache info
+  [38;2;74;222;128m✓[0m matrix generates config
+  [38;2;74;222;128m✓[0m matrix workflow file exists
+  [38;2;74;222;128m✓[0m validate passes on valid workflow
+  [38;2;74;222;128m✓[0m runners list shows options
+  [38;2;74;222;128m✓[0m runners recommend shows guidance
 
-[2mSetting up test environment...[0m
 
-[38;2;124;58;237m[1mAdversarial Review[0m
-  [38;2;0;212;255m▸[0m Adversarial review produces structured findings... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Adversarial iteration converges on no critical findings... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mDeveloper Simulation[0m
-  [38;2;0;212;255m▸[0m Simulation generates objections from 3 personas... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Simulation address returns action items... [38;2;74;222;128m✓[0m
+[2m  ──────────────────────────────────────────[0m
 
-[38;2;124;58;237m[1mArchitecture Enforcer[0m
-  [38;2;0;212;255m▸[0m Architecture model has valid schema... [38;2;74;222;128m✓[0m
-  [38;2;0;212;255m▸[0m Architecture validates changes (violation detected)... [38;2;74;222;128m✓[0m
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
 
-[38;2;124;58;237m[1mGraceful Degradation[0m
-  [38;2;0;212;255m▸[0m All three degrade gracefully when claude unavailable... [38;2;74;222;128m✓[0m
 
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
-[38;2;74;222;128m[1m  All 7 tests passed ✓[0m
-[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+
+[38;2;0;212;255m[1m  Shipwright Cleanup Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1m  Help[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows --force
+  [38;2;74;222;128m✓[0m help shows dry-run
+
+[1m  Dry-Run (Empty)[0m
+  [38;2;74;222;128m✓[0m dry-run shows Tmux Windows section
+  [38;2;74;222;128m✓[0m dry-run shows Team Configs section
+  [38;2;74;222;128m✓[0m dry-run shows Task Lists section
+  [38;2;74;222;128m✓[0m dry-run shows Pipeline Artifacts section
+  [38;2;74;222;128m✓[0m dry-run shows Pipeline State section
+  [38;2;74;222;128m✓[0m dry-run shows Heartbeats section
+  [38;2;74;222;128m✓[0m dry-run reports clean
+
+[1m  Force Mode (Empty)[0m
+  [38;2;74;222;128m✓[0m force shows FORCE MODE
+  [38;2;74;222;128m✓[0m force reports nothing to clean
+
+[1m  Detect Team Configs[0m
+  [38;2;74;222;128m✓[0m dry-run detects team dir
+  [38;2;74;222;128m✓[0m dry-run shows would remove
+
+[1m  Force Removes Teams[0m
+  [38;2;74;222;128m✓[0m force removes team dir
+  [38;2;74;222;128m✓[0m team directory actually removed
+
+[1m  Detect Task Lists[0m
+  [38;2;74;222;128m✓[0m dry-run detects task dir
+  [38;2;74;222;128m✓[0m task directory actually removed
+
+[1m  Detect Stale Heartbeats[0m
+  [38;2;74;222;128m✓[0m dry-run detects stale heartbeat
+
+[1m  Error Handling[0m
+  [38;2;74;222;128m✓[0m unknown option exits non-zero
+  [38;2;74;222;128m✓[0m unknown option shows error
+
+[1m  Summary Counting[0m
+  [38;2;74;222;128m✓[0m summary shows found count
+  [38;2;74;222;128m✓[0m summary shows --force hint
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 24 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Code Review Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;74;222;128m✓[0m help shows usage text
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m review runs and starts reviewing
+  [38;2;74;222;128m✓[0m trends with no data
+  [38;2;74;222;128m✓[0m config show outputs valid config
+  [38;2;74;222;128m✓[0m unknown subcommand exits nonzero
+  [38;2;74;222;128m✓[0m no false long function detection on small file
+  [38;2;74;222;128m✓[0m style consistency check runs without crash
+  [38;2;74;222;128m✓[0m architecture boundary check runs without crash
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
 
 
 [38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
@@ -560,24 +698,24 @@ All 16 tests passed!
 
 [2mSetting up test environment...[0m
 
-[38;2;124;58;237m[1mIdentity Resolution[0m
+[38;2;168;85;247m[1mIdentity Resolution[0m
   [38;2;0;212;255m▸[0m resolve_developer_id from DEVELOPER_ID env... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_developer_id from git config... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_developer_id fallback to USER... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_machine_name from MACHINE_NAME env... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_machine_name from hostname... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mDashboard URL Resolution[0m
+[38;2;168;85;247m[1mDashboard URL Resolution[0m
   [38;2;0;212;255m▸[0m resolve_dashboard_url from --url flag... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_dashboard_url from DASHBOARD_URL env... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_dashboard_url from team-config.json... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m resolve_dashboard_url falls back to default... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mStart/Stop Lifecycle[0m
+[38;2;168;85;247m[1mStart/Stop Lifecycle[0m
   [38;2;0;212;255m▸[0m cmd_start creates PID file... [38;2;0;212;255m[1m▸[0m Starting connect to [1mhttp://localhost:8767[0m
 [38;2;0;212;255m[1m▸[0m Developer: [1mtest-developer[0m @ [1mtest-machine[0m
-[38;2;74;222;128m[1m✓[0m Connect started (PID 1315235)
-  [2mLogs: /tmp/sw-connect-test.UX0pCu/home/.shipwright/connect.log[0m
+[38;2;74;222;128m[1m✓[0m Connect started (PID 15326)
+  [2mLogs: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-connect-test.kkYSxV/home/.shipwright/connect.log[0m
   [2mStop: shipwright connect stop[0m
 [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m cmd_start rejects if already running...   [2mStop it first: shipwright connect stop[0m
@@ -587,29 +725,3272 @@ All 16 tests passed!
   [38;2;0;212;255m▸[0m cmd_stop handles missing PID gracefully... [38;2;250;204;21m[1m⚠[0m Connect is not running (no PID file)
 [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mStatus[0m
+[38;2;168;85;247m[1mStatus[0m
   [38;2;0;212;255m▸[0m cmd_status shows connected when PID alive... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m cmd_status shows disconnected when no PID... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mJoin Flow[0m
+[38;2;168;85;247m[1mJoin Flow[0m
   [38;2;0;212;255m▸[0m cmd_join verifies token against dashboard... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m cmd_join saves team-config.json... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m cmd_join rejects invalid token... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m cmd_join accepts --url and --token flags... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mHeartbeat & Disconnect Payloads[0m
+[38;2;168;85;247m[1mHeartbeat & Disconnect Payloads[0m
   [38;2;0;212;255m▸[0m Heartbeat payload includes required fields... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m Send disconnect sends proper payload... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mConfiguration & Utilities[0m
+[38;2;168;85;247m[1mConfiguration & Utilities[0m
   [38;2;0;212;255m▸[0m ensure_dir creates shipwright directory... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m now_iso returns valid ISO timestamp... [38;2;74;222;128m✓[0m
   [38;2;0;212;255m▸[0m Script has correct version... [38;2;74;222;128m✓[0m
 
-[38;2;124;58;237m[1mIntegration[0m
+[38;2;168;85;247m[1mIntegration[0m
   [38;2;0;212;255m▸[0m Help command shows all main commands... [38;2;74;222;128m✓[0m
 
 [38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
 [38;2;74;222;128m[1m  All 25 tests passed ✓[0m
 [38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
 
+
+[38;2;0;212;255m[1m  Context Budget Monitor Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;0;212;255mBudget Initialization[0m
+  [38;2;74;222;128m✓[0m init creates config (exit 0)
+  [38;2;74;222;128m✓[0m config has correct total_budget
+  [38;2;74;222;128m✓[0m system_reserve is 10% (80000)
+  [38;2;74;222;128m✓[0m tools_reserve is 10% (80000)
+  [38;2;74;222;128m✓[0m working_memory is 60% (480000)
+  [38;2;74;222;128m✓[0m output_reserve is 20% (160000)
+
+  [38;2;0;212;255mToken Estimation[0m
+  [38;2;74;222;128m✓[0m estimation produces JSON
+  [38;2;74;222;128m✓[0m estimate contains utilization_percent
+  [38;2;74;222;128m✓[0m estimate contains total_used (>0)
+
+  [38;2;0;212;255mStatus Checking (Thresholds)[0m
+  [38;2;74;222;128m✓[0m 50% utilization returns green status
+  [38;2;74;222;128m✓[0m 70% utilization returns yellow status
+  [38;2;74;222;128m✓[0m 85% utilization returns red status
+  [38;2;74;222;128m✓[0m 95% utilization returns critical status
+
+  [38;2;0;212;255mContext Trimming[0m
+  [38;2;74;222;128m✓[0m green status doesn't trim content
+  [38;2;74;222;128m✓[0m yellow status reduces content length
+  [38;2;74;222;128m✓[0m hard truncate respects size limit
+
+  [38;2;0;212;255mIteration Summarization[0m
+  [38;2;74;222;128m✓[0m summarize_iteration succeeds (exit 0)
+  [38;2;74;222;128m✓[0m iteration summary file created with 1 entry
+
+  [38;2;0;212;255mBudget Report Generation[0m
+  [38;2;74;222;128m✓[0m report contains budget_config
+  [38;2;74;222;128m✓[0m report contains iteration_summaries
+
+  [38;2;0;212;255mState Logging[0m
+  [38;2;74;222;128m✓[0m log_state succeeds (exit 0)
+  [38;2;74;222;128m✓[0m log file created with entries
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 22 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Context Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;0;212;255mhelp command[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows commands
+  [38;2;74;222;128m✓[0m --help exits 0
+
+  [38;2;0;212;255merror handling[0m
+  [38;2;74;222;128m✓[0m unknown command exits 1
+  [38;2;74;222;128m✓[0m unknown command shows error
+
+  [38;2;0;212;255mshow subcommand[0m
+  [38;2;74;222;128m✓[0m show exits 0
+  [38;2;74;222;128m✓[0m show outputs context header
+
+  [38;2;0;212;255mclear subcommand[0m
+  [38;2;74;222;128m✓[0m clear exits 0
+  [38;2;74;222;128m✓[0m clear confirms cleared
+
+  [38;2;0;212;255mgather subcommand[0m
+  [38;2;74;222;128m✓[0m gather without args exits 1
+  [38;2;74;222;128m✓[0m gather shows must provide
+  [38;2;74;222;128m✓[0m gather with unknown option exits 1
+
+  [38;2;0;212;255mgather with goal[0m
+  [38;2;74;222;128m✓[0m gather exits 0
+  [38;2;74;222;128m✓[0m gather shows building
+  [38;2;74;222;128m✓[0m gather shows success
+  [38;2;74;222;128m✓[0m context-bundle.md created
+
+  [38;2;0;212;255mshow after gather[0m
+  [38;2;74;222;128m✓[0m show after gather exits 0
+  [38;2;74;222;128m✓[0m show contains pipeline context
+
+  [38;2;0;212;255mclear after gather[0m
+  [38;2;74;222;128m✓[0m clear exits 0
+
+  [38;2;0;212;255mgather with issue[0m
+  [38;2;74;222;128m✓[0m gather with --issue exits 0
+  [38;2;74;222;128m✓[0m gather shows building
+
+  [38;2;0;212;255mgather default stage[0m
+  [38;2;74;222;128m✓[0m gather default stage exits 0
+
+  [38;2;0;212;255minternal stage_guidance[0m
+  [38;2;74;222;128m✓[0m stage_guidance returns plan guidance
+  [38;2;74;222;128m✓[0m stage_guidance returns build guidance
+  [38;2;74;222;128m✓[0m stage_guidance handles unknown stage
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 26 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Cost Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[2m  help / version[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows USAGE
+  [38;2;74;222;128m✓[0m help shows COMMANDS
+  [38;2;74;222;128m✓[0m help mentions show
+  [38;2;74;222;128m✓[0m help mentions budget
+  [38;2;74;222;128m✓[0m help mentions calculate
+  [38;2;74;222;128m✓[0m VERSION variable defined
+
+[2m  state management[0m
+  [38;2;74;222;128m✓[0m costs.json created on first use
+  [38;2;74;222;128m✓[0m budget.json created on first use
+  [38;2;74;222;128m✓[0m costs.json has entries array
+  [38;2;74;222;128m✓[0m budget.json has daily_budget_usd
+
+[2m  budget commands[0m
+  [38;2;74;222;128m✓[0m budget set exits 0
+  [38;2;74;222;128m✓[0m budget set to 50
+  [38;2;74;222;128m✓[0m budget show exits 0
+
+[2m  error handling[0m
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
+
+[2m  calculate[0m
+  [38;2;74;222;128m✓[0m calculate exits 0
+
+[2m  script safety[0m
+  [38;2;74;222;128m✓[0m Uses set -euo pipefail
+  [38;2;74;222;128m✓[0m ERR trap is set
+
+[2m  context efficiency in cost dashboard[0m
+  [38;2;74;222;128m✓[0m Cost dashboard has CONTEXT EFFICIENCY section
+  [38;2;74;222;128m✓[0m Cost dashboard reads loop.context_efficiency events
+  [38;2;74;222;128m✓[0m Context efficiency reports utilization and waste
+  [38;2;74;222;128m✓[0m Dashboard renders CONTEXT EFFICIENCY with event data
+  [38;2;74;222;128m✓[0m Dashboard shows avg budget utilization
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+[38;2;168;85;247m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
+[38;2;168;85;247m[1m║  shipwright daemon test — Unit Tests (Synthetic Events)           ║[0m
+[38;2;168;85;247m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
+
+[2mSetting up test environment...[0m
+[38;2;74;222;128m✓[0m Environment ready: [2m/var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-daemon-test.tgqluq[0m
+
+  [38;2;0;212;255m▸[0m dora_grade deploy_freq Elite (>= 7)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m dora_grade deploy_freq High (>= 1)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m dora_grade deploy_freq Medium (>= 0.25)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m dora_grade deploy_freq Low (< 0.25)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m dora_grade CFR thresholds (Elite/High/Medium/Low)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Stage timings filter-first jq query... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m MTTR pairs failures with next success... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m epoch_to_iso helper function... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Health check detects stale jobs... scripts/sw-daemon-test.sh: line 120: 17144 Terminated: 15          sleep 300
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Priority label sorting... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Degradation alert triggers on high CFR... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Metrics --json output with cycle_time keys... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Self-labeling includes watch_label when enabled... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Self-labeling excludes watch_label when disabled... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Patrol recurring failures label construction... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m DORA degradation event detection... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Retry exhaustion event detection... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Untested script detection logic... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Progress detects stage advancement... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Progress detects stuck (no change N checks)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Progress detects repeated error loop... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Progress resets on diff growth... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Hard limit kills even with progress on... scripts/sw-daemon-test.sh: line 200: 18550 Terminated: 15          sleep 300
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Adaptive cycles extends limit on >50% issue drop... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Adaptive cycles reduces limit on issue increase... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Adaptive cycles respects 2x base hard ceiling... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Adaptive cycles no-op on first cycle... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cleanup: Checkpoint expire removes old checkpoints... [38;2;0;212;255m[1m▸[0m Expired: build checkpoint (1h+ old)
+[38;2;74;222;128m[1m✓[0m Expired 1 checkpoint(s) older than 1h
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cleanup: Failure handler removes watch label... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cleanup: Failure handler closes draft PRs... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cleanup: sw-cleanup.sh has all artifact cleanup sections... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon sources vitals module... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals verdict maps to daemon verdict (continue→healthy etc)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals emits pipeline.vitals_check events... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Auto-scale includes vitals health factor... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Quality memory drives template selection... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals-based progress with static fallback... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Memory: query fix for error returns matching fix... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Memory: DORA template escalation patterns exist... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Memory: All 12 error categories in post-tool-use.sh... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: Template weights selection reads weights file... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Daemon: Auto-enable self_optimize when auto_template is true... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: classify_failure detects auth errors... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: classify_failure has all 6 failure classes... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: Retry skips auth_error and invalid_issue... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: API errors get extended 300s backoff... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: daemon_preflight_auth_check exists and auto-pauses... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: Process group spawning (set -m)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: Process tree kill in cleanup (pkill -P)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: Consecutive failure auto-pause (3 threshold)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: Retry escalation args passed to spawn... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: classify_failure wired into retry logic... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1m━━━ Results ━━━[0m
+  [38;2;74;222;128mPassed:[0m 66
+  [38;2;248;113;113mFailed:[0m 0
+  [2mTotal:[0m  52
+
+[38;2;74;222;128m[1mAll 66 tests passed![0m
+
+
+[38;2;168;85;247m[1mDashboard Smoke Tests[0m
+
+[38;2;168;85;247m[1mStructure[0m
+  [38;2;0;212;255m▸[0m server.ts exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m server.ts has valid structure (imports, fetch)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m public/ directory exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m index.html exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m src/ directory exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m main.ts entry point exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m tsconfig.json exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m src/ modules exist (core, views, components, design, types, canvas)... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mRoutes[0m
+  [38;2;0;212;255m▸[0m Server exports /api/health and /api/status... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Server exports /ws WebSocket route... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Server exports /api/context-efficiency... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mIntegrity[0m
+  [38;2;0;212;255m▸[0m bun check passes (if bun available)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m index.html references dist/main.js... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Frontend bundle builds (if bun available)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m TypeScript type check passes (if tsc available)...     [2m(typescript not installed, skipping)[0m
+[38;2;74;222;128m✓[0m
+
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[38;2;74;222;128m[1m  All 15 tests passed ✓[0m
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+
+
+[38;2;0;212;255m[1m╔════════════════════════════════════════════════════════╗[0m
+[38;2;0;212;255m[1m║  shipwright db — SQLite Persistence Test Suite        ║[0m
+[38;2;0;212;255m[1m╚════════════════════════════════════════════════════════╝[0m
+
+[2mSetting up test environment...[0m
+
+[38;2;168;85;247m[1mSchema Creation[0m
+  [38;2;0;212;255m▸[0m init_schema creates all tables... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Schema includes required tables... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m WAL mode is enabled... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m check_sqlite3 caches result... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mDatabase Availability[0m
+  [38;2;0;212;255m▸[0m db_available returns true when ready... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m db_available returns false without sqlite3... /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-db-test.mzxqqq/sw-db.sh: line 19: dirname: command not found
+[38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mEvent CRUD Operations[0m
+  [38;2;0;212;255m▸[0m db_add_event inserts event... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m add_event dual-writes to SQLite + JSONL... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mDaemon State Management[0m
+  [38;2;0;212;255m▸[0m db_save_job saves active job... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m db_complete_job marks completed... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m db_fail_job marks failed... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m db_list_active_jobs returns JSON array... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m db_active_job_count returns count... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m db_is_issue_active checks status... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mCost Tracking[0m
+  [38;2;0;212;255m▸[0m db_record_cost saves entry... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m db_cost_today calculates total... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m db_set_budget and db_get_budget... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mHeartbeat Management[0m
+  [38;2;0;212;255m▸[0m db_record_heartbeat saves heartbeat... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m db_list_heartbeats returns array... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m db_clear_heartbeat deletes entry... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mMemory & Failure Tracking[0m
+  [38;2;0;212;255m▸[0m db_record_failure saves pattern... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m db_query_similar_failures finds matches... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mJSON Data Migration[0m
+  [38;2;0;212;255m▸[0m migrate_json_data imports events... [38;2;0;212;255m[1m▸[0m Migrating schema v0 → v2...
+[38;2;74;222;128m[1m✓[0m Migrated to schema v2
+[38;2;0;212;255m[1m▸[0m Migrating schema v0 → v3...
+[38;2;74;222;128m[1m✓[0m Migrated to schema v3
+[38;2;0;212;255m[1m▸[0m Migrating schema v0 → v4...
+[38;2;74;222;128m[1m✓[0m Migrated to schema v4
+[38;2;0;212;255m[1m▸[0m Migrating schema v0 → v5...
+[38;2;74;222;128m[1m✓[0m Migrated to schema v5
+[38;2;0;212;255m[1m▸[0m Migrating schema v0 → v6...
+[38;2;74;222;128m[1m✓[0m Migrated to schema v6
+[38;2;0;212;255m[1m▸[0m Importing events from /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-db-test.mzxqqq/home/.shipwright/events.jsonl...
+[38;2;74;222;128m[1m✓[0m Events: 2 imported, 0 skipped (duplicates)
+[38;2;0;212;255m[1m▸[0m Importing heartbeats...
+[38;2;74;222;128m[1m✓[0m Heartbeats: 0 imported
+
+[38;2;74;222;128m[1m✓[0m Migration complete: 2 total records imported
+
+[38;2;0;212;255m[1m▸[0m Verification:
+  Events in DB:     2
+  Cost entries:     0
+  Heartbeats:       0
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m migrate_json_data imports costs... [38;2;0;212;255m[1m▸[0m Database already at schema v6
+[38;2;0;212;255m[1m▸[0m Importing events from /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-db-test.mzxqqq/home/.shipwright/events.jsonl...
+[38;2;74;222;128m[1m✓[0m Events: 2 imported, 0 skipped (duplicates)
+[38;2;0;212;255m[1m▸[0m Importing costs from /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-db-test.mzxqqq/home/.shipwright/costs.json...
+[38;2;74;222;128m[1m✓[0m Costs: 2 entries imported
+[38;2;0;212;255m[1m▸[0m Importing heartbeats...
+[38;2;74;222;128m[1m✓[0m Heartbeats: 0 imported
+
+[38;2;74;222;128m[1m✓[0m Migration complete: 4 total records imported
+
+[38;2;0;212;255m[1m▸[0m Verification:
+  Events in DB:     2
+  Cost entries:     2
+  Heartbeats:       0
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m migrate_json_data imports budget... [38;2;0;212;255m[1m▸[0m Database already at schema v6
+[38;2;0;212;255m[1m▸[0m Importing events from /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-db-test.mzxqqq/home/.shipwright/events.jsonl...
+[38;2;74;222;128m[1m✓[0m Events: 2 imported, 0 skipped (duplicates)
+[38;2;0;212;255m[1m▸[0m Importing costs from /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-db-test.mzxqqq/home/.shipwright/costs.json...
+[38;2;74;222;128m[1m✓[0m Costs: 2 entries imported
+[38;2;0;212;255m[1m▸[0m Importing budget from /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-db-test.mzxqqq/home/.shipwright/budget.json...
+[38;2;74;222;128m[1m✓[0m Budget: imported ($50.00, enabled=true)
+[38;2;0;212;255m[1m▸[0m Importing heartbeats...
+[38;2;74;222;128m[1m✓[0m Heartbeats: 0 imported
+
+[38;2;74;222;128m[1m✓[0m Migration complete: 4 total records imported
+
+[38;2;0;212;255m[1m▸[0m Verification:
+  Events in DB:     2
+  Cost entries:     2
+  Heartbeats:       0
+[38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mHealth Checks[0m
+  [38;2;0;212;255m▸[0m db_health_check validates database... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mExport & Backup[0m
+  [38;2;0;212;255m▸[0m export_db creates JSON backup... [38;2;0;212;255m[1m▸[0m Exporting database to /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-db-test.mzxqqq/home/.shipwright/test-backup.json...
+[38;2;74;222;128m[1m✓[0m Database exported to /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-db-test.mzxqqq/home/.shipwright/test-backup.json
+[38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mData Cleanup[0m
+  [38;2;0;212;255m▸[0m cleanup_old_data removes old entries... [38;2;0;212;255m[1m▸[0m Cleaning records older than 30 days (before 2026-03-05T12:37:21Z)...
+[38;2;74;222;128m[1m✓[0m Deleted: 0 events, 0 costs, 0 daemon jobs, 0 stages
+[38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mConcurrent Operations[0m
+  [38;2;0;212;255m▸[0m Concurrent writes don't corrupt DB... 5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+[38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mPipeline Run Tracking[0m
+  [38;2;0;212;255m▸[0m add_pipeline_run creates entry... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m update_pipeline_status updates run... [38;2;74;222;128m✓[0m
+
+[38;2;0;212;255m[1m══════════════════════════════════════════════════════════[0m
+[38;2;74;222;128m[1m  All 31 tests passed ✓[0m
+[38;2;0;212;255m[1m══════════════════════════════════════════════════════════[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Decompose Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;0;212;255mhelp command[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows commands
+  [38;2;74;222;128m✓[0m --help exits 0
+
+  [38;2;0;212;255mversion flag[0m
+  [38;2;74;222;128m✓[0m --version exits 0
+  [38;2;74;222;128m✓[0m --version shows version
+
+  [38;2;0;212;255merror handling[0m
+  [38;2;74;222;128m✓[0m unknown command exits 1
+  [38;2;74;222;128m✓[0m unknown command shows error
+  [38;2;74;222;128m✓[0m analyze without issue exits 1
+  [38;2;74;222;128m✓[0m analyze shows usage
+  [38;2;74;222;128m✓[0m decompose without issue exits 1
+  [38;2;74;222;128m✓[0m auto without issue exits 1
+
+  [38;2;0;212;255manalyze subcommand (mock)[0m
+  [38;2;74;222;128m✓[0m analyze exits 0 with NO_GITHUB
+  [38;2;74;222;128m✓[0m analyze outputs complexity_score
+  [38;2;74;222;128m✓[0m analyze outputs should_decompose
+  [38;2;74;222;128m✓[0m analyze outputs subtasks
+  [38;2;74;222;128m✓[0m analyze outputs valid JSON
+  [38;2;74;222;128m✓[0m analyze returns complexity_score 85
+  [38;2;74;222;128m✓[0m analyze returns should_decompose true
+
+  [38;2;0;212;255mdecompose subcommand (mock)[0m
+  [38;2;74;222;128m✓[0m decompose exits 0 with NO_GITHUB
+  [38;2;74;222;128m✓[0m decompose shows decomposing
+
+  [38;2;0;212;255mauto subcommand (mock)[0m
+  [38;2;74;222;128m✓[0m auto exits 0 with NO_GITHUB
+
+  [38;2;0;212;255mstate file creation[0m
+  [38;2;74;222;128m✓[0m events.jsonl created
+
+  [38;2;0;212;255mDAG scheduling (new features)[0m
+  [38;2;74;222;128m✓[0m schedule exits 0
+  [38;2;74;222;128m✓[0m schedule shows valid DAG
+  [38;2;74;222;128m✓[0m schedule shows waves
+  [38;2;74;222;128m✓[0m critical-path exits 0
+  [38;2;74;222;128m✓[0m critical-path shows title
+  [38;2;74;222;128m✓[0m critical-path shows hours
+  [38;2;74;222;128m✓[0m visualize text exits 0
+  [38;2;74;222;128m✓[0m visualize shows DAG title
+  [38;2;74;222;128m✓[0m visualize shows task 0
+  [38;2;74;222;128m✓[0m visualize mermaid exits 0
+  [38;2;74;222;128m✓[0m visualize mermaid has graph
+  [38;2;74;222;128m✓[0m help shows schedule cmd
+  [38;2;74;222;128m✓[0m help shows critical-path cmd
+  [38;2;74;222;128m✓[0m help shows visualize cmd
+  [38;2;74;222;128m✓[0m version shows 3.2.4
+  [38;2;74;222;128m✓[0m mock data includes depends_on field
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 39 tests passed[0m
+
+
+[38;2;0;212;255m[1m  sw-decide Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+
+  [38;2;0;212;255mhelp[0m
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help mentions run
+  [38;2;74;222;128m✓[0m help mentions status
+  [38;2;74;222;128m✓[0m help mentions tiers
+  [38;2;74;222;128m✓[0m help mentions candidates
+  [38;2;74;222;128m✓[0m help mentions halt
+  [38;2;74;222;128m✓[0m help mentions resume
+  [38;2;74;222;128m✓[0m help mentions dry-run
+  [38;2;74;222;128m✓[0m --help shows usage
+
+  [38;2;0;212;255mtiers[0m
+  [38;2;74;222;128m✓[0m tiers shows auto
+  [38;2;74;222;128m✓[0m tiers shows propose
+  [38;2;74;222;128m✓[0m tiers shows draft
+  [38;2;74;222;128m✓[0m tiers shows category rules
+  [38;2;74;222;128m✓[0m tiers shows limits
+
+  [38;2;0;212;255msignals[0m
+  [38;2;74;222;128m✓[0m candidate has id
+  [38;2;74;222;128m✓[0m candidate has signal
+  [38;2;74;222;128m✓[0m candidate has category
+  [38;2;74;222;128m✓[0m candidate has risk_score
+  [38;2;74;222;128m✓[0m candidate has dedup_key
+  [38;2;74;222;128m✓[0m candidate has collected_at
+  [38;2;74;222;128m✓[0m candidate is valid JSON
+  [38;2;74;222;128m✓[0m read_pending returns data
+  [38;2;74;222;128m✓[0m clear_pending empties file
+
+  [38;2;0;212;255mscoring[0m
+  [38;2;74;222;128m✓[0m scored has value_score
+  [38;2;74;222;128m✓[0m scored has scores object
+  [38;2;74;222;128m✓[0m critical security scores well (75)
+  [38;2;74;222;128m✓[0m security scores higher than dead_code (75 > 33)
+  [38;2;74;222;128m✓[0m impact weight loaded
+  [38;2;74;222;128m✓[0m urgency weight loaded
+
+  [38;2;0;212;255mautonomy[0m
+  [38;2;74;222;128m✓[0m deps_patch -> auto
+  [38;2;74;222;128m✓[0m refactor_hotspot -> propose
+  [38;2;74;222;128m✓[0m new_feature -> draft
+  [38;2;74;222;128m✓[0m unknown -> draft
+  [38;2;74;222;128m✓[0m auto labels include shipwright
+  [38;2;74;222;128m✓[0m auto labels include ready-to-build
+  [38;2;74;222;128m✓[0m propose labels include proposed
+jq: parse error: Unmatched '}' at line 1, column 111
+jq: parse error: Unmatched '}' at line 1, column 111
+  [38;2;74;222;128m✓[0m budget available with no decisions
+jq: parse error: Unmatched '}' at line 1, column 111
+  [38;2;74;222;128m✓[0m budget exhausted after 16 issues
+  [38;2;74;222;128m✓[0m rate limit passes with no history
+jq: parse error: Unmatched '}' at line 1, column 111
+  [38;2;74;222;128m✓[0m rate limit blocks recent decision
+  [38;2;74;222;128m✓[0m not halted initially
+  [38;2;74;222;128m✓[0m halted after halt()
+  [38;2;74;222;128m✓[0m halt file created
+  [38;2;74;222;128m✓[0m resumed after resume()
+
+  [38;2;0;212;255mrisk ceiling[0m
+  [38;2;74;222;128m✓[0m risk 20 below ceiling 30
+  [38;2;74;222;128m✓[0m risk 35 above ceiling 30
+
+  [38;2;0;212;255mdry-run[0m
+  [38;2;74;222;128m✓[0m dry-run shows DRY RUN
+  [38;2;74;222;128m✓[0m no daily log created in dry-run
+  [38;2;74;222;128m✓[0m no drafts in dry-run
+
+  [38;2;0;212;255mdecision log[0m
+  [38;2;74;222;128m✓[0m daily log exists
+  [38;2;74;222;128m✓[0m log has decision id
+  [38;2;74;222;128m✓[0m log has value_score
+  [38;2;74;222;128m✓[0m last-decision written
+
+  [38;2;0;212;255moutcome learning[0m
+  [38;2;74;222;128m✓[0m urgency weight adjusted on security success (25)
+  [38;2;74;222;128m✓[0m risk weight increased on failure (13 >= 13)
+  [38;2;74;222;128m✓[0m weights sum to 100
+  [38;2;74;222;128m✓[0m weights file written
+
+  [38;2;0;212;255mcandidates[0m
+  [38;2;74;222;128m✓[0m candidates shows title
+  [38;2;74;222;128m✓[0m candidates shows signal
+
+  [38;2;0;212;255mhalt/resume CLI[0m
+  [38;2;74;222;128m✓[0m halt succeeds
+  [38;2;74;222;128m✓[0m run blocked when halted
+  [38;2;74;222;128m✓[0m resume succeeds
+
+  [38;2;0;212;255mstatus[0m
+  [38;2;74;222;128m✓[0m status shows active
+  [38;2;74;222;128m✓[0m status shows decisions
+  [38;2;74;222;128m✓[0m status shows budget
+  [38;2;74;222;128m✓[0m status shows weights
+
+  [38;2;0;212;255mcycle integration[0m
+  [38;2;74;222;128m✓[0m cycle shows Decision Engine
+  [38;2;74;222;128m✓[0m cycle shows Cycle Complete
+  [38;2;74;222;128m✓[0m cycle processes candidates
+  [38;2;74;222;128m✓[0m cycle shows AUTO tier
+  [38;2;74;222;128m✓[0m cycle shows DRAFT tier
+
+  [38;2;0;212;255mlog command[0m
+  [38;2;74;222;128m✓[0m log shows today's date
+  [38;2;74;222;128m✓[0m log shows entry
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 33 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Deps Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;0;212;255mhelp command[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows commands
+  [38;2;74;222;128m✓[0m --help exits 0
+
+  [38;2;0;212;255merror handling[0m
+  [38;2;74;222;128m✓[0m unknown command exits 1
+  [38;2;74;222;128m✓[0m unknown command shows error
+
+  [38;2;0;212;255mscan subcommand[0m
+  [38;2;74;222;128m✓[0m scan exits 0 with NO_GITHUB
+  [38;2;74;222;128m✓[0m scan shows warning
+
+  [38;2;0;212;255mclassify subcommand[0m
+  [38;2;74;222;128m✓[0m classify without args exits 1
+  [38;2;74;222;128m✓[0m classify shows usage
+  [38;2;74;222;128m✓[0m classify exits 0 with NO_GITHUB
+  [38;2;74;222;128m✓[0m classify shows warning
+
+  [38;2;0;212;255mbatch subcommand[0m
+  [38;2;74;222;128m✓[0m batch exits 0 with NO_GITHUB
+  [38;2;74;222;128m✓[0m batch shows warning
+
+  [38;2;0;212;255mreport subcommand[0m
+  [38;2;74;222;128m✓[0m report exits 0 with NO_GITHUB
+  [38;2;74;222;128m✓[0m report shows warning
+
+  [38;2;0;212;255mmerge subcommand[0m
+  [38;2;74;222;128m✓[0m merge without args exits 1
+
+  [38;2;0;212;255mtest subcommand[0m
+  [38;2;74;222;128m✓[0m test without args exits 1
+
+  [38;2;0;212;255minternal parse_version_bump[0m
+  [38;2;74;222;128m✓[0m parse_version_bump detects patch
+  [38;2;74;222;128m✓[0m parse_version_bump detects minor
+  [38;2;74;222;128m✓[0m parse_version_bump detects major
+  [38;2;74;222;128m✓[0m parse_version_bump handles v prefix
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 22 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  shipwright developer-simulation test[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1mScript Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m source guard uses if/then/fi pattern
+
+[1mVersion[0m
+  [38;2;74;222;128m✓[0m VERSION variable defined
+
+[1mHelp Output[0m
+  [38;2;74;222;128m✓[0m help contains USAGE
+  [38;2;74;222;128m✓[0m help contains review subcommand
+  [38;2;74;222;128m✓[0m help contains address subcommand
+  [38;2;74;222;128m✓[0m help contains PERSONAS
+  [38;2;74;222;128m✓[0m help contains simulation_enabled
+  [38;2;74;222;128m✓[0m --help flag works
+
+[1mError Handling[0m
+  [38;2;74;222;128m✓[0m unknown command exits non-zero
+  [38;2;74;222;128m✓[0m unknown command mentions error
+
+[1mReview Subcommand[0m
+  [38;2;74;222;128m✓[0m review warns when disabled
+  [38;2;74;222;128m✓[0m review returns empty JSON array when disabled
+
+[1mAddress Subcommand[0m
+  [38;2;74;222;128m✓[0m address with no objections succeeds
+  [38;2;74;222;128m✓[0m address returns empty JSON
+
+[1mPersona Definitions[0m
+  [38;2;74;222;128m✓[0m security persona defined
+  [38;2;74;222;128m✓[0m performance persona defined
+  [38;2;74;222;128m✓[0m maintainability persona defined
+
+[1mConfiguration[0m
+  [38;2;74;222;128m✓[0m SIMULATION_MAX_ROUNDS env var supported
+  [38;2;74;222;128m✓[0m daemon-config.json checked
+
+[1mEvent Emission[0m
+  [38;2;74;222;128m✓[0m emits simulation.objection events
+  [38;2;74;222;128m✓[0m emits simulation.complete events
+  [38;2;74;222;128m✓[0m emits simulation.addressed events
+
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Discovery Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;0;212;255mhelp command[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows commands
+  [38;2;74;222;128m✓[0m --help exits 0
+
+  [38;2;0;212;255merror handling[0m
+  [38;2;74;222;128m✓[0m unknown command exits 1
+  [38;2;74;222;128m✓[0m unknown command shows error
+  [38;2;74;222;128m✓[0m broadcast without args exits 1
+  [38;2;74;222;128m✓[0m query without args exits 1
+  [38;2;74;222;128m✓[0m inject without args exits 1
+
+  [38;2;0;212;255mbroadcast subcommand[0m
+  [38;2;74;222;128m✓[0m broadcast exits 0
+  [38;2;74;222;128m✓[0m broadcast confirms
+  [38;2;74;222;128m✓[0m discoveries.jsonl created
+  [38;2;74;222;128m✓[0m discoveries.jsonl contains valid JSON
+
+  [38;2;0;212;255mquery subcommand[0m
+  [38;2;74;222;128m✓[0m query exits 0
+  [38;2;74;222;128m✓[0m query finds discovery
+  [38;2;74;222;128m✓[0m query non-match exits 0
+  [38;2;74;222;128m✓[0m query reports no discoveries
+
+  [38;2;0;212;255mstatus subcommand[0m
+  [38;2;74;222;128m✓[0m status exits 0
+  [38;2;74;222;128m✓[0m status shows total
+
+  [38;2;0;212;255mclean subcommand[0m
+  [38;2;74;222;128m✓[0m clean exits 0
+  [38;2;74;222;128m✓[0m clean reports result
+
+  [38;2;0;212;255minject subcommand[0m
+  [38;2;74;222;128m✓[0m inject exits 0
+
+  [38;2;0;212;255minternal patterns_overlap[0m
+  [38;2;74;222;128m✓[0m patterns_overlap matches same pattern
+  [38;2;74;222;128m✓[0m patterns_overlap rejects different paths
+
+  [38;2;0;212;255mprioritize subcommand[0m
+  [38;2;74;222;128m✓[0m prioritize security exits 0
+  [38;2;74;222;128m✓[0m prioritize assigns P0
+  [38;2;74;222;128m✓[0m prioritize assigns P3
+
+  [38;2;0;212;255mscore subcommand[0m
+  [38;2;74;222;128m✓[0m score exits 0
+  [38;2;74;222;128m✓[0m score returns numeric result: 89
+
+  [38;2;0;212;255macknowledge subcommand[0m
+  [38;2;74;222;128m✓[0m acknowledge exits 0
+  [38;2;74;222;128m✓[0m consumption file created
+  [38;2;74;222;128m✓[0m consumption count incremented
+
+  [38;2;0;212;255mconsumption stats[0m
+  [38;2;74;222;128m✓[0m consumption stats valid JSON
+  [38;2;74;222;128m✓[0m consumption count correct
+
+  [38;2;0;212;255mmemory promotion[0m
+  [38;2;74;222;128m✓[0m promotion function exists
+
+  [38;2;0;212;255mfleet broadcast[0m
+  [38;2;74;222;128m✓[0m fleet broadcast function exists
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 36 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Doc Fleet Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1m  Help[0m
+  [38;2;74;222;128m✓[0m help shows title
+  [38;2;74;222;128m✓[0m help shows commands section
+  [38;2;74;222;128m✓[0m help shows fleet roles section
+  [38;2;74;222;128m✓[0m help shows examples
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m unknown command shows error
+[1m  Roles[0m
+  [38;2;74;222;128m✓[0m roles lists doc-architect
+  [38;2;74;222;128m✓[0m roles lists claude-md
+  [38;2;74;222;128m✓[0m roles lists strategy-curator
+  [38;2;74;222;128m✓[0m roles lists pattern-writer
+  [38;2;74;222;128m✓[0m roles lists readme-optimizer
+[1m  Audit[0m
+  [38;2;74;222;128m✓[0m audit shows health header
+  [38;2;74;222;128m✓[0m audit shows health score
+  [38;2;74;222;128m✓[0m audit checks doc inventory
+  [38;2;74;222;128m✓[0m audit checks CLAUDE.md
+  [38;2;74;222;128m✓[0m audit checks agent roles
+  [38;2;74;222;128m✓[0m audit creates state file
+  [38;2;74;222;128m✓[0m audit records health score (91%)
+[1m  Launch[0m
+  [38;2;74;222;128m✓[0m launch dry-run shows header
+  [38;2;74;222;128m✓[0m launch dry-run mentions dry-run
+  [38;2;74;222;128m✓[0m launch dry-run lists doc-architect
+  [38;2;74;222;128m✓[0m launch dry-run lists claude-md
+  [38;2;74;222;128m✓[0m launch dry-run lists strategy-curator
+  [38;2;74;222;128m✓[0m launch dry-run lists pattern-writer
+  [38;2;74;222;128m✓[0m launch dry-run lists readme-optimizer
+  [38;2;74;222;128m✓[0m launch dry-run shows agent count
+  [38;2;74;222;128m✓[0m launch specific role shows role
+  [38;2;74;222;128m✓[0m launch specific role shows 1 agent
+  [38;2;74;222;128m✓[0m launch invalid role shows error
+[1m  Status[0m
+  [38;2;74;222;128m✓[0m status shows header
+  [38;2;74;222;128m✓[0m status shows last run
+  [38;2;74;222;128m✓[0m status shows health score
+  [38;2;74;222;128m✓[0m status shows session list
+[1m  Manifest[0m
+  [38;2;74;222;128m✓[0m manifest shows generation
+  [38;2;74;222;128m✓[0m manifest file created
+  [38;2;74;222;128m✓[0m manifest has documents (16)
+[1m  Report[0m
+  [38;2;74;222;128m✓[0m report shows header
+  [38;2;74;222;128m✓[0m report shows inventory
+  [38;2;74;222;128m✓[0m report shows volume
+  [38;2;74;222;128m✓[0m report shows fleet state
+  [38;2;74;222;128m✓[0m report json shows JSON
+  [38;2;74;222;128m✓[0m JSON report file created
+[1m  Retire[0m
+  [38;2;74;222;128m✓[0m retire shows retiring
+  [38;2;74;222;128m✓[0m retire shows count
+[1m  State Persistence[0m
+  [38;2;74;222;128m✓[0m status shows run count after commands
+[1m  Events[0m
+  [38;2;74;222;128m✓[0m doc_fleet events logged (8 events)
+[1m  Aliases[0m
+  [38;2;74;222;128m✓[0m start alias works
+  [38;2;74;222;128m✓[0m stop alias works
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 48 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Docs Agent Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1m  Help[0m
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows commands
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m unknown command shows error
+[1m  Coverage[0m
+  [38;2;74;222;128m✓[0m coverage shows header
+  [38;2;74;222;128m✓[0m coverage shows total scripts
+[1m  API Reference[0m
+  [38;2;74;222;128m✓[0m api generation succeeds
+  [38;2;74;222;128m✓[0m api file has title
+[1m  Wiki[0m
+  [38;2;74;222;128m✓[0m wiki generation succeeds
+  [38;2;74;222;128m✓[0m wiki directory created
+[1m  Scan[0m
+  [38;2;74;222;128m✓[0m scan shows scanning
+[1m  Sync[0m
+  [38;2;74;222;128m✓[0m sync shows sync complete
+[1m  Impact[0m
+  [38;2;74;222;128m✓[0m impact shows analysis
+[1m  State[0m
+  [38;2;74;222;128m✓[0m docs-agent home directory exists
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 14 tests passed[0m
+
+
+[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
+[38;2;0;212;255m[1m║  shipwright docs — Test Suite                     ║[0m
+[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+
+[2mSetting up test environment...[0m
+
+[38;2;168;85;247m[1mAUTO Section Discovery[0m
+  [38;2;0;212;255m▸[0m find_auto_files discovers CLAUDE.md... [38;2;74;222;128mPASS[0m
+  [38;2;0;212;255m▸[0m get_sections extracts section IDs... [38;2;74;222;128mPASS[0m
+
+[38;2;168;85;247m[1mSection Generators[0m
+  [38;2;0;212;255m▸[0m Architecture table has headers and scripts... [38;2;74;222;128mPASS[0m
+  [38;2;0;212;255m▸[0m Architecture table includes CLI router... [38;2;74;222;128mPASS[0m
+  [38;2;0;212;255m▸[0m Feature flags table with intelligence config... [38;2;74;222;128mPASS[0m
+  [38;2;0;212;255m▸[0m Test suites table picks up test files... [38;2;74;222;128mPASS[0m
+
+[38;2;168;85;247m[1mSection Check & Replace[0m
+  [38;2;0;212;255m▸[0m check_section detects fresh vs stale... [38;2;74;222;128mPASS[0m
+  [38;2;0;212;255m▸[0m replace_section updates content between markers... [38;2;74;222;128mPASS[0m
+
+[38;2;168;85;247m[1mSubcommands[0m
+  [38;2;0;212;255m▸[0m docs check returns 1 when stale... [38;2;74;222;128mPASS[0m
+  [38;2;0;212;255m▸[0m docs sync then check returns 0 (fresh)... [38;2;74;222;128mPASS[0m
+  [38;2;0;212;255m▸[0m docs sync is idempotent... [38;2;74;222;128mPASS[0m
+
+[38;2;168;85;247m[1mCLI & Help[0m
+  [38;2;0;212;255m▸[0m Help output contains all subcommands... [38;2;74;222;128mPASS[0m
+  [38;2;0;212;255m▸[0m Unknown command exits with error... [38;2;74;222;128mPASS[0m
+  [38;2;0;212;255m▸[0m Default (no args) shows help... [38;2;74;222;128mPASS[0m
+
+[38;2;168;85;247m[1mEdge Cases[0m
+  [38;2;0;212;255m▸[0m No AUTO markers returns 0... [38;2;74;222;128mPASS[0m
+  [38;2;0;212;255m▸[0m Multiple sections all get processed... [38;2;74;222;128mPASS[0m
+  [38;2;0;212;255m▸[0m Purpose extracted from script headers... [38;2;74;222;128mPASS[0m
+  [38;2;0;212;255m▸[0m Wiki dry-run succeeds... [38;2;74;222;128mPASS[0m
+
+[2m  ──────────────────────────────────────────[0m
+  [38;2;74;222;128m[1m18 passed[0m  [38;2;248;113;113m[1m0 failed[0m  [2m(18 total)[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Doctor Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[2m  execution[0m
+  [38;2;74;222;128m✓[0m doctor runs without crash
+  [38;2;74;222;128m✓[0m output shows PREREQUISITES
+  [38;2;74;222;128m✓[0m detects tmux
+  [38;2;74;222;128m✓[0m detects jq
+  [38;2;74;222;128m✓[0m detects Claude Code CLI
+  [38;2;74;222;128m✓[0m detects git
+
+[2m  structure[0m
+  [38;2;74;222;128m✓[0m VERSION variable defined
+  [38;2;74;222;128m✓[0m Uses set -euo pipefail
+  [38;2;74;222;128m✓[0m ERR trap is set
+  [38;2;74;222;128m✓[0m check_pass helper defined
+  [38;2;74;222;128m✓[0m check_fail helper defined
+  [38;2;74;222;128m✓[0m output shows Shipwright header
+
+[2m  check logic for tools[0m
+  [38;2;74;222;128m✓[0m Source checks for tmux
+  [38;2;74;222;128m✓[0m Source checks for jq
+  [38;2;74;222;128m✓[0m Source checks for Claude CLI
+  [38;2;74;222;128m✓[0m Source checks for git
+  [38;2;74;222;128m✓[0m Source checks for gh
+
+[2m  version flag[0m
+  [38;2;74;222;128m✓[0m --version outputs sw-doctor and version
+  [38;2;74;222;128m✓[0m -V short flag works
+
+[2m  missing tool handling[0m
+  [38;2;74;222;128m✓[0m Doctor reports when jq missing from PATH
+  [38;2;74;222;128m✓[0m output includes PREREQUISITES section
+  [38;2;74;222;128m✓[0m output includes INSTALLED FILES section
+
+[2m  auto-fix mode[0m
+  [38;2;74;222;128m✓[0m --fix-dry flag shows dry-run output
+[38;2;248;113;113m[1m✗[0m Overlay not found: ~/.tmux/shipwright-overlay.conf
+[38;2;248;113;113m[1m✗[0m No ~/.claude/settings.json — agent teams not configured
+[38;2;248;113;113m[1m✗[0m Overlay not found — pane display features unavailable
+[38;2;248;113;113m[1m✗[0m iTerm2 mouse reporting is DISABLED — tmux cannot receive mouse clicks
+  [38;2;74;222;128m✓[0m --fix creates .claude directories
+  [38;2;74;222;128m✓[0m --fix creates ~/.shipwright directories
+  [38;2;74;222;128m✓[0m --fix creates valid daemon-config.json
+  [38;2;74;222;128m✓[0m --fix creates valid settings.json
+  [38;2;74;222;128m✓[0m --fix creates valid budget.json
+[38;2;248;113;113m[1m✗[0m No ~/.claude/settings.json — agent teams not configured
+[38;2;248;113;113m[1m✗[0m iTerm2 mouse reporting is DISABLED — tmux cannot receive mouse clicks
+  [38;2;74;222;128m✓[0m --fix is idempotent (second run succeeds)
+[38;2;248;113;113m[1m✗[0m No ~/.claude/settings.json — agent teams not configured
+[38;2;248;113;113m[1m✗[0m iTerm2 mouse reporting is DISABLED — tmux cannot receive mouse clicks
+  [38;2;74;222;128m✓[0m --fix handles existing config files safely
+  [38;2;74;222;128m✓[0m --fix without other args works
+  [38;2;74;222;128m✓[0m Auto-fix output shows AUTO-FIX SUMMARY
+  [38;2;74;222;128m✓[0m Auto-fix reports what was fixed
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  shipwright dora test[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1mScript Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m source guard uses if/then/fi pattern
+
+[1mVersion[0m
+  [38;2;74;222;128m✓[0m VERSION variable defined
+
+[1mHelp Output[0m
+  [38;2;74;222;128m✓[0m help contains USAGE
+  [38;2;74;222;128m✓[0m help contains show subcommand
+  [38;2;74;222;128m✓[0m help contains dx subcommand
+  [38;2;74;222;128m✓[0m help contains ai subcommand
+  [38;2;74;222;128m✓[0m help contains trends subcommand
+  [38;2;74;222;128m✓[0m help contains compare subcommand
+  [38;2;74;222;128m✓[0m help contains export subcommand
+  [38;2;74;222;128m✓[0m help contains DORA BANDS
+  [38;2;74;222;128m✓[0m --help flag works
+
+[1mError Handling[0m
+  [38;2;74;222;128m✓[0m unknown command exits non-zero
+  [38;2;74;222;128m✓[0m unknown command error message
+
+[1mShow Subcommand (no events)[0m
+  [38;2;74;222;128m✓[0m show displays DORA Metrics
+  [38;2;74;222;128m✓[0m show displays Deploy Frequency
+  [38;2;74;222;128m✓[0m show displays Lead Time
+  [38;2;74;222;128m✓[0m show displays Change Failure Rate
+  [38;2;74;222;128m✓[0m show displays MTTR
+
+[1mDX Subcommand[0m
+  [38;2;74;222;128m✓[0m dx displays Developer Experience
+
+[1mAI Subcommand[0m
+  [38;2;74;222;128m✓[0m ai displays AI Performance Metrics
+
+[1mExport Subcommand[0m
+  [38;2;74;222;128m✓[0m export produces JSON with timestamp
+  [38;2;74;222;128m✓[0m export contains current_period
+  [38;2;74;222;128m✓[0m export contains previous_period
+
+[1mTrends Subcommand[0m
+  [38;2;74;222;128m✓[0m trends displays Trends heading
+
+[1mCompare Subcommand[0m
+  [38;2;74;222;128m✓[0m compare displays Period Comparison
+
+[1mDORA Band Classification[0m
+  [38;2;74;222;128m✓[0m classify_band function defined
+  [38;2;74;222;128m✓[0m Elite band classification
+  [38;2;74;222;128m✓[0m High band classification
+  [38;2;74;222;128m✓[0m Medium band classification
+  [38;2;74;222;128m✓[0m Low band classification
+
+[1mTrend Arrows[0m
+  [38;2;74;222;128m✓[0m trend_arrow function defined
+
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Durable Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[2m  help / version[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows USAGE
+  [38;2;74;222;128m✓[0m help mentions publish
+  [38;2;74;222;128m✓[0m help mentions consume
+  [38;2;74;222;128m✓[0m help mentions checkpoint
+  [38;2;74;222;128m✓[0m help mentions lock
+  [38;2;74;222;128m✓[0m help mentions compact
+  [38;2;74;222;128m✓[0m help mentions status
+  [38;2;74;222;128m✓[0m VERSION variable defined
+
+[2m  publish events[0m
+  [38;2;74;222;128m✓[0m publish exits 0
+  [38;2;74;222;128m✓[0m WAL file created
+  [38;2;74;222;128m✓[0m Event written to WAL
+
+[2m  error handling[0m
+  [38;2;74;222;128m✓[0m publish without args exits non-zero
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
+
+[2m  status command[0m
+  [38;2;74;222;128m✓[0m status exits 0
+
+[2m  checkpointing[0m
+  [38;2;74;222;128m✓[0m checkpoint save exits 0
+  [38;2;74;222;128m✓[0m Checkpoint file created
+  [38;2;74;222;128m✓[0m checkpoint restore exits 0
+
+[2m  distributed locks[0m
+  [38;2;74;222;128m✓[0m lock acquire exits 0
+  [38;2;74;222;128m✓[0m lock release exits 0
+
+[2m  script safety[0m
+  [38;2;74;222;128m✓[0m Uses set -euo pipefail
+  [38;2;74;222;128m✓[0m Has source guard pattern
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright E2E Orchestrator Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;74;222;128m✓[0m help shows usage text
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m unknown command exits nonzero
+  [38;2;74;222;128m✓[0m registry file created on init
+  [38;2;74;222;128m✓[0m registry is valid JSON
+  [38;2;74;222;128m✓[0m registry has >= 3 default suites
+  [38;2;74;222;128m✓[0m register adds suite
+  [38;2;74;222;128m✓[0m duplicate register fails
+  [38;2;74;222;128m✓[0m quarantine adds test
+  [38;2;74;222;128m✓[0m quarantine list has entry
+  [38;2;74;222;128m✓[0m report handles no results
+  [38;2;74;222;128m✓[0m flaky handles no history
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Eventbus Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;0;212;255mhelp command[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows subcommands
+  [38;2;74;222;128m✓[0m --help exits 0
+
+  [38;2;0;212;255merror handling[0m
+  [38;2;74;222;128m✓[0m unknown command exits 1
+  [38;2;74;222;128m✓[0m unknown command shows error
+
+  [38;2;0;212;255mstatus subcommand[0m
+  [38;2;74;222;128m✓[0m status exits 0 with empty bus
+  [38;2;74;222;128m✓[0m status shows title
+
+  [38;2;0;212;255mpublish subcommand[0m
+  [38;2;74;222;128m✓[0m publish exits 0
+  [38;2;74;222;128m✓[0m publish confirms
+  [38;2;74;222;128m✓[0m events.jsonl created
+  [38;2;74;222;128m✓[0m events.jsonl contains published event type
+  [38;2;74;222;128m✓[0m events.jsonl contains correlation_id
+  [38;2;74;222;128m✓[0m eventbus has 3+ events after multi-publish
+
+  [38;2;0;212;255mstatus with events[0m
+  [38;2;74;222;128m✓[0m status with events exits 0
+  [38;2;74;222;128m✓[0m status shows total events
+  [38;2;74;222;128m✓[0m status shows events by type
+
+  [38;2;0;212;255mclean subcommand[0m
+  [38;2;74;222;128m✓[0m clean exits 0
+  [38;2;74;222;128m✓[0m clean reports result
+
+  [38;2;0;212;255mreplay subcommand[0m
+  [38;2;74;222;128m✓[0m replay exits 0
+  [38;2;74;222;128m✓[0m replay shows replaying
+
+  [38;2;0;212;255mpublish error handling[0m
+  [38;2;74;222;128m✓[0m publish with empty type exits 1
+  [38;2;74;222;128m✓[0m watch with missing dir exits 1
+  [38;2;74;222;128m✓[0m watch shows dir error
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 24 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Feedback Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;0;212;255mhelp command[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows subcommands
+  [38;2;74;222;128m✓[0m --help exits 0
+
+  [38;2;0;212;255merror handling[0m
+  [38;2;74;222;128m✓[0m unknown command exits 1
+  [38;2;74;222;128m✓[0m unknown command shows error
+
+  [38;2;0;212;255mcollect subcommand[0m
+  [38;2;74;222;128m✓[0m collect on empty dir exits 0
+  [38;2;74;222;128m✓[0m collect shows collecting
+  [38;2;74;222;128m✓[0m collect shows save path
+
+  [38;2;0;212;255mcollect with error log[0m
+  [38;2;74;222;128m✓[0m collect with errors exits 0
+  [38;2;74;222;128m✓[0m collect reports errors
+
+  [38;2;0;212;255manalyze subcommand[0m
+  [38;2;74;222;128m✓[0m analyze missing file exits 1
+  [38;2;74;222;128m✓[0m analyze shows not found
+  [38;2;74;222;128m✓[0m analyze exits 0
+  [38;2;74;222;128m✓[0m analyze shows report
+
+  [38;2;0;212;255mlearn subcommand[0m
+  [38;2;74;222;128m✓[0m learn exits 0
+  [38;2;74;222;128m✓[0m learn confirms capture
+  [38;2;74;222;128m✓[0m incidents.jsonl created
+  [38;2;74;222;128m✓[0m incidents.jsonl has valid JSONL
+
+  [38;2;0;212;255mreport subcommand[0m
+  [38;2;74;222;128m✓[0m report exits 0
+  [38;2;74;222;128m✓[0m report shows incidents
+  [38;2;74;222;128m✓[0m report shows total
+  [38;2;74;222;128m✓[0m report no incidents exits 0
+  [38;2;74;222;128m✓[0m report says no incidents
+
+  [38;2;0;212;255mcreate-issue subcommand[0m
+  [38;2;74;222;128m✓[0m create-issue with NO_GITHUB exits 0
+  [38;2;74;222;128m✓[0m create-issue skips with NO_GITHUB
+
+  [38;2;0;212;255mpost-merge monitoring[0m
+  [38;2;74;222;128m✓[0m post-merge exits 0
+  [38;2;74;222;128m✓[0m post-merge shows monitoring
+  [38;2;74;222;128m✓[0m post-merge creates monitoring file
+  [38;2;74;222;128m✓[0m monitoring has merge_sha
+  [38;2;74;222;128m✓[0m monitoring has environment
+
+  [38;2;0;212;255mregression detection[0m
+  [38;2;74;222;128m✓[0m regression detection outputs valid JSON
+  [38;2;74;222;128m✓[0m no regression flag
+  [38;2;74;222;128m✓[0m deploy failure detects regression
+  [38;2;74;222;128m✓[0m deploy failure is P0
+  [38;2;74;222;128m✓[0m deploy failure type
+  [38;2;74;222;128m✓[0m error spike detects regression
+  [38;2;74;222;128m✓[0m error spike is P1
+  [38;2;74;222;128m✓[0m error spike type
+
+  [38;2;0;212;255mcorrelate with changes[0m
+  [38;2;74;222;128m✓[0m correlate outputs valid JSON
+  [38;2;74;222;128m✓[0m correlation has pr_number
+
+  [38;2;0;212;255mlearn from outcome[0m
+  [38;2;74;222;128m✓[0m outcomes exits 0
+  [38;2;74;222;128m✓[0m outcomes shows recording
+  [38;2;74;222;128m✓[0m outcomes creates merge-outcomes file
+  [38;2;74;222;128m✓[0m outcomes file has valid JSONL
+  [38;2;74;222;128m✓[0m outcome has pr_number
+
+  [38;2;0;212;255mhealth report[0m
+  [38;2;74;222;128m✓[0m health with no data exits 0
+  [38;2;74;222;128m✓[0m health shows no data message
+  [38;2;74;222;128m✓[0m health shows statistics
+  [38;2;74;222;128m✓[0m health shows success rate
+  [38;2;74;222;128m✓[0m health shows regressions
+
+  [38;2;0;212;255mintegrated post-merge workflow[0m
+  [38;2;74;222;128m✓[0m workflow: monitoring complete
+  [38;2;74;222;128m✓[0m workflow: regression detection valid
+  [38;2;74;222;128m✓[0m workflow: correlation valid
+  [38;2;74;222;128m✓[0m workflow: outcome recorded
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 55 tests passed[0m
+
+
+╔════════════════════════════════════════════════════════════╗
+║  Outcome Feedback Test Suite                              ║
+╚════════════════════════════════════════════════════════════╝
+
+▸ Skipping review capture (NO_GITHUB set)
+[38;2;74;222;128m✓[0m review feedback capture stores correct JSON
+✓ Computed merge quality: PR #100 score=1 (clean_merge)
+[38;2;74;222;128m✓[0m merge quality scoring clean merge → +1
+✓ Computed merge quality: PR #101 score=-1 (changes_requested)
+[38;2;74;222;128m✓[0m merge quality scoring changes_requested → -1
+✓ Computed merge quality: PR #102 score=-3 (reverted)
+[38;2;74;222;128m✓[0m merge quality scoring reverted → -3
+✓ Computed merge quality: PR #103 score=-2 (regression)
+[38;2;74;222;128m✓[0m merge quality scoring regression → -2
+✓ Computed merge quality: PR #200 score=1 (clean_merge)
+✓ Computed merge quality: PR #201 score=1 (clean_merge)
+✓ Computed merge quality: PR #202 score=-1 (changes_requested)
+[38;2;74;222;128m✓[0m rolling quality score calculation
+[38;2;74;222;128m✓[0m pattern detection: 3 error_handling comments → detected
+[38;2;74;222;128m✓[0m pattern detection: 2 comments → not detected
+▸ Generating learned rules from review patterns...
+✓ Added learned rule: testing (confidence: 0.6)
+[38;2;74;222;128m✓[0m learned rule generation creates valid JSON
+▸ Generating learned rules from review patterns...
+▸ Rule already exists for category: error_handling
+▸ Generating learned rules from review patterns...
+▸ Rule already exists for category: error_handling
+[38;2;74;222;128m✓[0m learned rule addition to quality profile is idempotent
+▸ Running post-merge feedback collection for PR #700...
+▸ Skipping review capture (NO_GITHUB set)
+✓ Computed merge quality: PR #700 score=1 (clean_merge)
+✓ Post-merge feedback collection complete
+[38;2;74;222;128m✓[0m post-merge feedback runs all steps
+✓ Computed merge quality: PR #800 score=1 (clean_merge)
+[38;2;74;222;128m✓[0m works when no previous feedback exists (cold start)
+
+╔════════════════════════════════════════════════════════════╗
+║  PASSED: 12   FAILED: 0    TOTAL: 12                        ║
+╚════════════════════════════════════════════════════════════╝
+
+
+[38;2;168;85;247m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
+[38;2;168;85;247m[1m║  shipwright fix test — Unit Tests                                  ║[0m
+[38;2;168;85;247m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
+
+[2mSetting up test environment...[0m
+[38;2;74;222;128m✓[0m Environment ready: [2m/var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-fix-test.LlaaBt[0m
+
+  [38;2;0;212;255m▸[0m Help output contains expected sections... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Help via --help flag... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Missing goal shows error... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Missing repos shows error... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Arg parsing — --repos comma-separated... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Arg parsing — --repos-from file... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Arg parsing — --repos-from missing file... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Arg parsing — --pipeline template... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Arg parsing — --max-parallel... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Arg parsing — --branch-prefix... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Dry run shows what would happen... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Dry run does not create state file... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fix status — no sessions... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fix status shows existing sessions... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Invalid repo directory shows error... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fix start creates state file... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fix start emits events... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fix start — summary output... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Branch name sanitization... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fix header shows configuration... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Non-git repo warning... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Per-repo event tracking... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1m━━━ Results ━━━[0m
+  [38;2;74;222;128mPassed:[0m 22
+  [38;2;248;113;113mFailed:[0m 0
+  [2mTotal:[0m  22
+
+[38;2;74;222;128m[1mAll 22 tests passed![0m
+
+
+
+[38;2;0;212;255m[1m  shipwright fleet-discover test[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1mScript Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m source guard uses if/then/fi pattern
+
+[1mVersion[0m
+  [38;2;74;222;128m✓[0m VERSION variable defined
+
+[1mHelp Output[0m
+  [38;2;74;222;128m✓[0m help contains USAGE
+  [38;2;74;222;128m✓[0m help contains --org option
+  [38;2;74;222;128m✓[0m help contains --language option
+  [38;2;74;222;128m✓[0m help contains --dry-run option
+  [38;2;74;222;128m✓[0m help contains --json option
+  [38;2;74;222;128m✓[0m help contains --topic option
+  [38;2;74;222;128m✓[0m help contains --exclude-topic option
+  [38;2;74;222;128m✓[0m help contains --min-activity-days
+
+[1mArgument Validation[0m
+  [38;2;74;222;128m✓[0m missing --org exits non-zero
+  [38;2;74;222;128m✓[0m missing --org error message
+
+[1mError Handling[0m
+  [38;2;74;222;128m✓[0m unknown option exits non-zero
+  [38;2;74;222;128m✓[0m unknown option error
+
+[1mNO_GITHUB Check[0m
+  [38;2;74;222;128m✓[0m NO_GITHUB blocks discovery
+  [38;2;74;222;128m✓[0m NO_GITHUB shows error
+
+[1mArgument Parsing[0m
+  [38;2;74;222;128m✓[0m supports --org=value syntax
+  [38;2;74;222;128m✓[0m supports --config=value syntax
+  [38;2;74;222;128m✓[0m supports --language=value syntax
+  [38;2;74;222;128m✓[0m supports --topic=value syntax
+
+[1mConfig Merge[0m
+  [38;2;74;222;128m✓[0m merge added new repo
+  [38;2;74;222;128m✓[0m merge preserved existing repo
+
+[1mFilter Logic[0m
+  [38;2;74;222;128m✓[0m filters archived repos
+  [38;2;74;222;128m✓[0m filters disabled repos
+  [38;2;74;222;128m✓[0m checks has_issues
+  [38;2;74;222;128m✓[0m language filter applied
+  [38;2;74;222;128m✓[0m topic filter applied
+  [38;2;74;222;128m✓[0m exclude topic filter
+  [38;2;74;222;128m✓[0m checks .shipwright-ignore
+
+[1mEvent Emission[0m
+  [38;2;74;222;128m✓[0m emits fleet.discover.completed event
+  [38;2;74;222;128m✓[0m emits fleet.discover.merged event
+
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+[38;2;168;85;247m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
+[38;2;168;85;247m[1m║  shipwright fleet test — Unit Tests                                ║[0m
+[38;2;168;85;247m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
+
+[2mSetting up test environment...[0m
+[38;2;74;222;128m✓[0m Environment ready: [2m/var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-fleet-test.TROF8n[0m
+
+  [38;2;0;212;255m▸[0m Help output contains expected sections... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Help via --help flag... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Config parsing — valid config... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Config parsing — missing config file... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Config parsing — invalid JSON... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Config parsing — empty repos array... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Config defaults applied... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet init generates config template... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet init skips when config exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet start spawns tmux sessions per repo... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet start skips missing repos... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet start skips existing sessions... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet start creates fleet state file... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet start emits fleet.started event... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet start applies repo-level overrides... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet stop kills sessions and cleans state... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet stop — no fleet running... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet stop emits fleet.stopped event... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet status — no fleet running... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet status shows dashboard... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet metrics — no events file... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet metrics dashboard output... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet metrics JSON output... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet metrics period flag... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Session name generation... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fleet start skips non-git repos... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Unknown subcommand... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1m━━━ Results ━━━[0m
+  [38;2;74;222;128mPassed:[0m 27
+  [38;2;248;113;113mFailed:[0m 0
+  [2mTotal:[0m  27
+
+[38;2;74;222;128m[1mAll 27 tests passed![0m
+
+
+
+[38;2;0;212;255m[1m  shipwright fleet-viz test[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1mScript Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m source guard uses if/then/fi pattern
+
+[1mVersion[0m
+  [38;2;74;222;128m✓[0m VERSION variable defined
+
+[1mHelp Output[0m
+  [38;2;74;222;128m✓[0m help contains USAGE
+  [38;2;74;222;128m✓[0m help contains overview subcommand
+  [38;2;74;222;128m✓[0m help contains workers subcommand
+  [38;2;74;222;128m✓[0m help contains insights subcommand
+  [38;2;74;222;128m✓[0m help contains queue subcommand
+  [38;2;74;222;128m✓[0m help contains costs subcommand
+  [38;2;74;222;128m✓[0m help contains export subcommand
+  [38;2;74;222;128m✓[0m --help flag works
+
+[1mError Handling[0m
+  [38;2;74;222;128m✓[0m unknown command exits non-zero
+  [38;2;74;222;128m✓[0m unknown command error message
+
+[1mOverview Subcommand[0m
+  [38;2;74;222;128m✓[0m overview shows Fleet Overview
+  [38;2;74;222;128m✓[0m overview shows Active count
+  [38;2;74;222;128m✓[0m overview shows Queued count
+  [38;2;74;222;128m✓[0m overview shows Repos count
+
+[1mWorkers Subcommand[0m
+  [38;2;74;222;128m✓[0m workers shows Worker Allocation
+  [38;2;74;222;128m✓[0m workers shows Remote Machines
+
+[1mQueue Subcommand[0m
+  [38;2;74;222;128m✓[0m queue shows Issue Queue
+  [38;2;74;222;128m✓[0m queue shows queued items
+
+[1mCosts Subcommand[0m
+  [38;2;74;222;128m✓[0m costs shows Fleet Costs
+  [38;2;74;222;128m✓[0m costs shows Total Spend
+  [38;2;74;222;128m✓[0m costs shows Per-Repo
+  [38;2;74;222;128m✓[0m costs shows Per-Model
+
+[1mExport Subcommand[0m
+  [38;2;74;222;128m✓[0m export produces JSON with active_jobs
+
+[1mInsights Subcommand[0m
+  [38;2;74;222;128m✓[0m insights shows Fleet Insights
+  [38;2;74;222;128m✓[0m insights shows Success Rate
+
+[1mDefault Command[0m
+  [38;2;74;222;128m✓[0m default command shows Fleet Overview
+
+[1mHealth Helpers[0m
+  [38;2;74;222;128m✓[0m get_health_status function defined
+  [38;2;74;222;128m✓[0m color_health function defined
+  [38;2;74;222;128m✓[0m healthy status handled
+  [38;2;74;222;128m✓[0m degraded status handled
+  [38;2;74;222;128m✓[0m failing status handled
+
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
+[38;2;0;212;255m[1m║  shipwright frontier — Test Suite                 ║[0m
+[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+
+[2mSetting up test environment...[0m
+
+[38;2;168;85;247m[1mAdversarial Review[0m
+  [38;2;0;212;255m▸[0m Adversarial review produces structured findings... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Adversarial iteration converges on no critical findings... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mDeveloper Simulation[0m
+  [38;2;0;212;255m▸[0m Simulation generates objections from 3 personas... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Simulation address returns action items... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mArchitecture Enforcer[0m
+  [38;2;0;212;255m▸[0m Architecture model has valid schema... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Architecture validates changes (violation detected)... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mGraceful Degradation[0m
+  [38;2;0;212;255m▸[0m All three degrade gracefully when claude unavailable... [38;2;74;222;128m✓[0m
+
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[38;2;74;222;128m[1m  All 7 tests passed ✓[0m
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright GitHub App Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1m  Help[0m
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows commands
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m unknown command shows error
+[1m  Status[0m
+  [38;2;74;222;128m✓[0m status without config warns
+[1m  Events[0m
+  [38;2;74;222;128m✓[0m events with no log warns
+[1m  Manifest[0m
+  [38;2;74;222;128m✓[0m manifest contains app name
+  [38;2;74;222;128m✓[0m manifest contains webhook URL
+  [38;2;74;222;128m✓[0m manifest success message
+  [38;2;74;222;128m✓[0m manifest output is valid JSON
+[1m  Configured Status[0m
+  [38;2;74;222;128m✓[0m configured status shows app ID
+  [38;2;74;222;128m✓[0m configured status shows install ID
+  [38;2;74;222;128m✓[0m events shows recent events
+[1m  Token[0m
+  [38;2;74;222;128m✓[0m token without key file errors
+[1m  Verify[0m
+  [38;2;74;222;128m✓[0m verify without secret errors
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 15 tests passed[0m
+
+
+[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
+[38;2;0;212;255m[1m║  shipwright github-checks — Test Suite            ║[0m
+[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+
+[2mSetting up test environment...[0m
+
+[38;2;168;85;247m[1mChecks API Availability[0m
+  [38;2;0;212;255m▸[0m _gh_checks_available: returns true when API accessible... {"check_runs":[],"total_count":0}
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m _gh_checks_available: returns false on 403... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mCheck Run CRUD[0m
+  [38;2;0;212;255m▸[0m gh_checks_create_run: returns run ID from response... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_checks_create_run: handles 403 gracefully... [38;2;250;204;21m[1m⚠[0m Failed to create check run 'test-check' (API returned 1)
+ERROR: scripts/sw-github-checks-test.sh:224 exited with status 1
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_checks_update_run: sends correct PATCH request... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_checks_update_run: skips when run_id empty... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_checks_annotate: respects 50-annotation limit... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_checks_list_runs: parses response correctly... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_checks_complete: convenience wrapper works... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mPipeline Integration[0m
+  [38;2;0;212;255m▸[0m gh_checks_pipeline_start: creates runs for all stages... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_checks_stage_update: looks up stored run IDs... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mNO_GITHUB Guard[0m
+  [38;2;0;212;255m▸[0m NO_GITHUB: all functions return early... [38;2;74;222;128m✓[0m
+
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[38;2;74;222;128m[1m  All 12 tests passed ✓[0m
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+
+
+[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
+[38;2;0;212;255m[1m║  shipwright github-deploy — Test Suite            ║[0m
+[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+
+[2mSetting up test environment...[0m
+
+[38;2;168;85;247m[1mDeployment CRUD[0m
+  [38;2;0;212;255m▸[0m gh_deploy_create: returns deployment ID... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_deploy_create: handles 403 gracefully... [38;2;250;204;21m[1m⚠[0m Failed to create deployment for ref 'main' to 'production' (API returned 1)
+ERROR: scripts/sw-github-deploy-test.sh:158 exited with status 1
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_deploy_update_status: sends correct POST... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_deploy_update_status: skips when deploy_id empty... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_deploy_list: parses deployment list... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_deploy_latest: returns first result... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mRollback[0m
+  [38;2;0;212;255m▸[0m gh_deploy_rollback: creates new deployment with prev ref... [38;2;0;212;255m[1m▸[0m Rolling back to ref: v2.9
+[38;2;74;222;128m[1m✓[0m Rolled back to v2.9 (deployment 301)
+[38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mPipeline Integration[0m
+  [38;2;0;212;255m▸[0m gh_deploy_pipeline_start: stores deployment ID... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_deploy_pipeline_complete: updates status correctly... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mNO_GITHUB Guard[0m
+  [38;2;0;212;255m▸[0m NO_GITHUB: all functions return early... [38;2;74;222;128m✓[0m
+
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[38;2;74;222;128m[1m  All 10 tests passed ✓[0m
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+
+
+[38;2;168;85;247m[1m━━━ shipwright github-graphql tests ━━━[0m
+
+  [38;2;0;212;255m▸[0m Fresh cache returns cached data... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Stale cache returns miss... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Atomic writes leave no temp files... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_file_change_frequency returns count... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_contributors returns parsed list... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_similar_issues truncates long text... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_branch_protection handles 404... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_security_alerts handles 403... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_dependabot_alerts handles 403... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_repo_context aggregates data... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m NO_GITHUB returns defaults... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m _gh_detect_repo parses SSH URL... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m _gh_detect_repo parses HTTPS URL... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m _gh_detect_repo parses HTTPS without .git... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_codeowners parses CODEOWNERS file... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cache clear removes all files... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_commit_history returns parsed commits... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_blame_data aggregates authors... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m gh_actions_runs calculates duration... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Events emitted for cache hit/miss... [38;2;74;222;128m✓[0m
+
+[38;2;124;58;237m[1m━━━ Results ━━━[0m
+  [38;2;74;222;128mPassed:[0m 20
+  [38;2;248;113;113mFailed:[0m 0
+  [2mTotal:[0m  20
+
+[38;2;74;222;128m[1mAll 20 tests passed![0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Guild Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;74;222;128m✓[0m help shows usage text
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m no args shows help
+  [38;2;74;222;128m✓[0m list shows Available Guilds
+  [38;2;74;222;128m✓[0m guild config.json created
+  [38;2;74;222;128m✓[0m guild config is valid JSON
+  [38;2;74;222;128m✓[0m guilds.json data file created
+  [38;2;74;222;128m✓[0m show security guild
+  [38;2;74;222;128m✓[0m show invalid guild exits nonzero
+  [38;2;74;222;128m✓[0m show without name exits nonzero
+  [38;2;74;222;128m✓[0m add pattern succeeds
+  [38;2;74;222;128m✓[0m pattern saved in data file
+  [38;2;74;222;128m✓[0m report shows guild data
+  [38;2;74;222;128m✓[0m report for specific guild
+  [38;2;74;222;128m✓[0m inject security shows knowledge
+  [38;2;74;222;128m✓[0m unknown command exits nonzero
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
+[38;2;0;212;255m[1m║  shipwright heartbeat + checkpoint — Test Suite   ║[0m
+[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+
+[2mSetting up test environment...[0m
+
+[38;2;168;85;247m[1mHeartbeat Lifecycle[0m
+  [38;2;0;212;255m▸[0m Write heartbeat creates JSON file... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Check heartbeat reports alive... ✓ Job test-job-alive alive (0s ago)
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Check heartbeat reports stale... ⚠ Job test-job-stale stale (197469510s ago, timeout: 120s)
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Clear heartbeat removes file... ✓ Cleared heartbeat for job: test-job-clear
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m List heartbeats returns JSON array... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Heartbeat update overwrites existing... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Check missing heartbeat returns error... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Heartbeat dir auto-created when missing... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mCheckpoint Lifecycle[0m
+  [38;2;0;212;255m▸[0m Checkpoint save creates JSON file... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 5)
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Checkpoint restore outputs JSON... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mtest[0m (iteration 3)
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Checkpoint restore missing stage fails... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Checkpoint clear removes file... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mreview[0m (iteration 1)
+[38;2;74;222;128m[1m✓[0m Cleared checkpoint for stage [1mreview[0m
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Checkpoint clear --all removes all... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 1)
+[38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mtest[0m (iteration 2)
+[38;2;74;222;128m[1m✓[0m Cleared 2 checkpoint(s)
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Checkpoint save with files-modified... [38;2;74;222;128m[1m✓[0m Checkpoint saved for stage [1mbuild[0m (iteration 7)
+[38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mIntegration[0m
+  [38;2;0;212;255m▸[0m Pipeline script has heartbeat functions... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Loop script has heartbeat and checkpoint... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline has human intervention checks... [38;2;74;222;128m✓[0m
+
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[38;2;74;222;128m[1m  All 17 tests passed ✓[0m
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+
+sw-hello-test.sh
+  [38;2;74;222;128m[1m✓[0m hello command outputs 'Shipwright vX.Y.Z'
+  [38;2;74;222;128m[1m✓[0m hello command exits with code 0
+  [38;2;74;222;128m[1m✓[0m hello --help displays help text
+  [38;2;74;222;128m[1m✓[0m hello -h displays help text
+  [38;2;74;222;128m[1m✓[0m hello --version displays 'Shipwright vX.Y.Z'
+  [38;2;74;222;128m[1m✓[0m hello version matches package.json (3.2.4)
+  [38;2;74;222;128m[1m✓[0m hello with invalid option exits with code 1
+
+PASS: 7
+FAIL: 0
+
+
+[38;2;0;212;255m[1m  Shipwright Hygiene Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;0;212;255mhelp command[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows subcommands
+  [38;2;74;222;128m✓[0m --help exits 0
+
+  [38;2;0;212;255merror handling[0m
+  [38;2;74;222;128m✓[0m unknown subcommand exits 1
+  [38;2;74;222;128m✓[0m unknown subcommand shows error
+
+  [38;2;0;212;255mreport subcommand[0m
+  [38;2;74;222;128m✓[0m report exits 0
+  [38;2;74;222;128m✓[0m report shows generating
+  [38;2;74;222;128m✓[0m report exits 0
+  [38;2;74;222;128m✓[0m report creates JSON file
+  [38;2;74;222;128m✓[0m report JSON is valid
+  [38;2;74;222;128m✓[0m report JSON has timestamp
+  [38;2;74;222;128m✓[0m report JSON has sections
+
+  [38;2;0;212;255mstructure subcommand[0m
+  [38;2;74;222;128m✓[0m structure exits 0
+  [38;2;74;222;128m✓[0m structure reports validating
+
+  [38;2;0;212;255mnaming subcommand[0m
+  [38;2;74;222;128m✓[0m naming exits 0
+  [38;2;74;222;128m✓[0m naming shows checking
+
+  [38;2;0;212;255mdead-code subcommand[0m
+  [38;2;74;222;128m✓[0m dead-code exits 0
+  [38;2;74;222;128m✓[0m dead-code shows scanning
+
+  [38;2;0;212;255mdependencies subcommand[0m
+  [38;2;74;222;128m✓[0m dependencies exits 0
+  [38;2;74;222;128m✓[0m dependencies shows auditing
+
+  [38;2;0;212;255mplatform-refactor subcommand[0m
+  [38;2;74;222;128m✓[0m platform-refactor exits 0
+  [38;2;74;222;128m✓[0m platform-refactor scans for hardcoded/fallback
+  [38;2;74;222;128m✓[0m platform-refactor creates platform-hygiene.json with counts
+
+  [38;2;0;212;255mpolicy read (policy_get from config)[0m
+  [38;2;74;222;128m✓[0m policy_get returns value from config
+  [38;2;74;222;128m✓[0m policy_get returns default when key missing
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 26 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Incident Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[2m  help / version[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m help shows USAGE
+  [38;2;74;222;128m✓[0m help mentions watch
+  [38;2;74;222;128m✓[0m help mentions list
+  [38;2;74;222;128m✓[0m help mentions report
+  [38;2;74;222;128m✓[0m help mentions stats
+  [38;2;74;222;128m✓[0m VERSION variable defined
+
+[2m  error handling[0m
+  [38;2;74;222;128m✓[0m Unknown command exits non-zero
+
+[2m  list command[0m
+  [38;2;74;222;128m✓[0m list with no incidents exits 0
+
+[2m  stats command[0m
+  [38;2;74;222;128m✓[0m stats with no data exits 0
+
+[2m  state management[0m
+  [38;2;74;222;128m✓[0m Incident config created
+  [38;2;74;222;128m✓[0m Incident config is valid JSON
+
+[2m  script safety[0m
+  [38;2;74;222;128m✓[0m Uses set -euo pipefail
+  [38;2;74;222;128m✓[0m Has source guard pattern
+  [38;2;74;222;128m✓[0m ERR trap is set
+
+[2m  config subcommand[0m
+  [38;2;74;222;128m✓[0m config subcommand creates valid JSON config
+
+[2m  subcommand usage[0m
+ERROR: scripts/sw-incident-test.sh:203 exited with status 1
+  [38;2;74;222;128m✓[0m show subcommand fails or shows usage when missing args
+  [38;2;74;222;128m✓[0m report subcommand shows usage when missing args
+
+[2m  detect_pipeline_failures[0m
+  [38;2;74;222;128m✓[0m detect_pipeline_failures defined and callable
+  [38;2;74;222;128m✓[0m report with nonexistent incident handles gracefully
+  [38;2;74;222;128m✓[0m gap list subcommand produces expected output
+
+[2m  timeline updates[0m
+  [38;2;74;222;128m✓[0m Timeline update creates valid JSON
+  [38;2;74;222;128m✓[0m Timeline entry has all required fields
+
+[2m  correlation engine[0m
+  [38;2;74;222;128m✓[0m Correlation engine produces valid JSON
+
+[2m  escalation logic[0m
+  [38;2;74;222;128m✓[0m Escalation includes P0 rules
+  [38;2;74;222;128m✓[0m Escalation function defined
+
+[2m  rollback verification[0m
+  [38;2;74;222;128m✓[0m Rollback verification function defined
+  [38;2;74;222;128m✓[0m Rollback verification updates timeline
+
+[2m  auto-remediate subcommand[0m
+  [38;2;74;222;128m✓[0m auto-remediate subcommand shows usage when missing args
+
+[2m  deep analysis[0m
+  [38;2;74;222;128m✓[0m Deep analysis function defined
+  [38;2;74;222;128m✓[0m Deep analysis returns valid JSON with required fields
+  [38;2;74;222;128m✓[0m Config includes auto_remediate_enabled flag
+  [38;2;74;222;128m✓[0m Config includes escalation rules for all severities
+
+[2m  post-mortem report[0m
+  [38;2;74;222;128m✓[0m Post-mortem report includes Timeline section
+  [38;2;74;222;128m✓[0m Post-mortem report references timeline fields
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
+[38;2;0;212;255m[1m║  shipwright init — E2E Test Suite                 ║[0m
+[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+
+[2mSetting up sandboxed environment...[0m
+[2mTemp dir: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-init-test.A30bb1[0m
+
+[38;2;168;85;247m[1mConfiguration[0m
+  [38;2;0;212;255m▸[0m Settings.json created with agent teams... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Settings merge preserves existing vars... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m tmux.conf installed... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Overlay installed... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mTemplates[0m
+  [38;2;0;212;255m▸[0m Team templates installed (>= 10)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline templates installed (>= 5)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Legacy templates path populated... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mRobustness[0m
+  [38;2;0;212;255m▸[0m Idempotency — double init safe... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Doctor runs at end... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Help flag... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mHook Wiring[0m
+  [38;2;0;212;255m▸[0m JSONC stripped from settings.json... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Hooks wired into settings.json... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Hook wiring preserves existing hooks... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m SessionStart hook installed... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Hook wiring with pre-existing settings... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mRepair & Cleanup[0m
+  [38;2;0;212;255m▸[0m Legacy overlay cleanup... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Legacy overlay source-file reference stripped... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Repair mode forces clean reinstall... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Plugin direct-clone fallback (outside tmux)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Post-install verification... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m tmux adapter deployed... [38;2;74;222;128m✓[0m
+
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[38;2;74;222;128m[1m  All 21 tests passed ✓[0m
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Instrument Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1m  Help & Version[0m
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows commands
+  [38;2;74;222;128m✓[0m help shows start
+  [38;2;74;222;128m✓[0m help shows record
+  [38;2;74;222;128m✓[0m help shows version
+
+[1m  Start Command[0m
+  [38;2;74;222;128m✓[0m start without --run-id exits non-zero
+  [38;2;74;222;128m✓[0m start without --run-id shows error
+  [38;2;74;222;128m✓[0m start with --run-id exits 0
+  [38;2;74;222;128m✓[0m start confirms run ID
+  [38;2;74;222;128m✓[0m start creates run file
+  [38;2;74;222;128m✓[0m run file contains correct run_id
+  [38;2;74;222;128m✓[0m run file contains correct issue
+
+[1m  Record Command[0m
+  [38;2;74;222;128m✓[0m record exits 0
+  [38;2;74;222;128m✓[0m record confirms metric
+  [38;2;74;222;128m✓[0m run file has 1 metric
+  [38;2;74;222;128m✓[0m record without all args exits non-zero
+  [38;2;74;222;128m✓[0m record on missing run exits non-zero
+  [38;2;74;222;128m✓[0m record on missing run shows error
+
+[1m  Stage Start/End[0m
+  [38;2;74;222;128m✓[0m stage-start exits 0
+  [38;2;74;222;128m✓[0m stage-start confirms stage
+  [38;2;74;222;128m✓[0m stage-end exits 0
+  [38;2;74;222;128m✓[0m stage result recorded
+
+[1m  Finish Command[0m
+  [38;2;74;222;128m✓[0m finish exits 0
+  [38;2;74;222;128m✓[0m finish confirms completion
+  [38;2;74;222;128m✓[0m finish removes active run file
+  [38;2;74;222;128m✓[0m finish writes to completed JSONL
+
+[1m  Trends & Export[0m
+  [38;2;74;222;128m✓[0m trends with no data exits 0
+  [38;2;74;222;128m✓[0m trends with no data warns
+  [38;2;74;222;128m✓[0m export with no data exits 0
+  [38;2;74;222;128m✓[0m export with no data warns
+
+[1m  Error Handling[0m
+  [38;2;74;222;128m✓[0m unknown command exits non-zero
+  [38;2;74;222;128m✓[0m unknown command shows error
+  [38;2;74;222;128m✓[0m events.jsonl created from instrument operations
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 33 tests passed[0m
+
+
+[38;2;168;85;247m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
+[38;2;168;85;247m[1m║  shipwright intelligence test — Unit Tests                       ║[0m
+[38;2;168;85;247m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
+
+[2mSetting up test environment...[0m
+[38;2;74;222;128m✓[0m Environment ready: [2m/var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-intelligence-test.FKhlqe[0m
+
+  [38;2;0;212;255m▸[0m analyze_issue returns valid schema... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cache hit on second call with same input... WARN: Unknown event type 'intelligence.cache_hit' — update config/event-schema.json
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Graceful degradation when claude CLI unavailable... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m compose_pipeline produces valid pipeline JSON... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m recommend_model returns valid model names... WARN: Unknown event type 'intelligence.model' — update config/event-schema.json
+WARN: Unknown event type 'intelligence.model' — update config/event-schema.json
+WARN: Unknown event type 'intelligence.model' — update config/event-schema.json
+WARN: Unknown event type 'intelligence.model' — update config/event-schema.json
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m predict_cost returns numeric estimates... WARN: Unknown event type 'intelligence.prediction' — update config/event-schema.json
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cache TTL expiry returns miss... scripts/sw-intelligence-test.sh: line 334: _intelligence_md5: command not found
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m search_memory returns ranked results... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Feature flag disabled returns fallback...     [38;2;248;113;113m✗[0m Expected 'intelligence_disabled', got 'null' (returns intelligence_disabled error)
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Events emitted for analysis... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m recommend_model emits events... WARN: Unknown event type 'intelligence.model' — update config/event-schema.json
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cache init creates file if missing... [38;2;74;222;128m✓[0m
+
+[38;2;124;58;237m[1m━━━ Results ━━━[0m
+  [38;2;74;222;128mPassed:[0m 12
+  [38;2;248;113;113mFailed:[0m 0
+  [2mTotal:[0m  12
+
+[38;2;74;222;128m[1mAll 12 tests passed![0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Jira Test Suite[0m
+[2m  ══════════════════════════════════════════[0m
+
+
+[1m  Script Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m VERSION variable defined
+  [38;2;74;222;128m✓[0m VERSION is semver: 3.2.4
+
+[1m  Help Output[0m
+  [38;2;74;222;128m✓[0m help mentions USAGE
+  [38;2;74;222;128m✓[0m help mentions sync command
+  [38;2;74;222;128m✓[0m help mentions update command
+  [38;2;74;222;128m✓[0m help mentions status command
+  [38;2;74;222;128m✓[0m help mentions init command
+  [38;2;74;222;128m✓[0m help mentions JIRA_BASE_URL
+  [38;2;74;222;128m✓[0m --help works
+
+[1m  Error Handling[0m
+
+[38;2;0;212;255m[1mshipwright jira[0m — Jira ↔ GitHub Bidirectional Sync
+
+[1mUSAGE[0m
+  [38;2;0;212;255mshipwright jira[0m <command> [options]
+
+[1mCOMMANDS[0m
+  [38;2;0;212;255msync[0m [--dry-run]              Sync Jira To Do issues → GitHub
+  [38;2;0;212;255mupdate[0m <issue> <status>       Update linked Jira ticket status
+  [38;2;0;212;255mstatus[0m                        Show Jira board dashboard
+  [38;2;0;212;255minit[0m                          Configure Jira connection
+  [38;2;0;212;255mhelp[0m                          Show this help
+
+[1mSTATUS VALUES[0m
+  [38;2;0;212;255mstarted[0m     Pipeline spawned   → Jira: In Progress
+  [38;2;0;212;255mreview[0m      PR created         → Jira: In Review
+  [38;2;0;212;255mdone[0m        Pipeline complete   → Jira: Done
+  [38;2;0;212;255mfailed[0m      Pipeline failed     → Jira: adds failure comment
+
+[1mEXAMPLES[0m
+  [2mshipwright jira init[0m                    # Set up Jira connection
+  [2mshipwright jira sync[0m                    # Sync To Do → GitHub
+  [2mshipwright jira sync --dry-run[0m          # Preview what would sync
+  [2mshipwright jira update 42 started[0m       # Mark as In Progress
+  [2mshipwright jira update 42 review[0m        # Mark as In Review
+  [2mshipwright jira update 42 done[0m          # Mark as Done
+  [2mshipwright jira status[0m                  # Show board dashboard
+
+[1mENVIRONMENT[0m
+  [2mJIRA_BASE_URL[0m       Jira instance URL (or use 'jira init' to save)
+  [2mJIRA_EMAIL[0m          Account email for authentication
+  [2mJIRA_API_TOKEN[0m      API token from Atlassian account
+  [2mJIRA_PROJECT_KEY[0m    Jira project key (e.g. PROJ)
+  [38;2;74;222;128m✓[0m unknown command exits non-zero
+  [38;2;74;222;128m✓[0m unknown command shows error
+
+[1m  Default Behavior[0m
+  [38;2;74;222;128m✓[0m no-arg defaults to help
+
+[1m  Configuration[0m
+  [38;2;74;222;128m✓[0m sync without config shows error
+  [38;2;74;222;128m✓[0m update without config shows error
+  [38;2;74;222;128m✓[0m status without config shows error
+
+[1m  Config Loading[0m
+  [38;2;74;222;128m✓[0m sync with config proceeds
+
+[1m  Update Subcommand[0m
+  [38;2;74;222;128m✓[0m update without args shows usage
+
+[1m  Notify Integration[0m
+  [38;2;74;222;128m✓[0m notify subcommand executes without crash
+
+[1m  Atomic Writes[0m
+  [38;2;74;222;128m✓[0m init uses atomic write (tmp + mv)
+  [38;2;74;222;128m✓[0m config file gets restricted permissions
+
+[1m  Event Emission[0m
+  [38;2;74;222;128m✓[0m emits jira events
+  [38;2;74;222;128m✓[0m uses EVENTS_FILE for event logging
+
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
+[38;2;0;212;255m[1m║  shipwright launchd + systemd — Test Suite       ║[0m
+[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+
+[2mSetting up test environment...[0m
+
+[38;2;168;85;247m[1mOS Detection[0m
+  [38;2;0;212;255m▸[0m macOS detection sets OSTYPE correctly... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Linux detection routes to systemd... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mmacOS Plist Generation[0m
+  [38;2;0;212;255m▸[0m Daemon plist has correct structure... [38;2;0;212;255m[1m▸[0m Installing launchd agents...
+[38;2;74;222;128m[1m✓[0m Created daemon plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;250;204;21m[1m⚠[0m server.ts not found at /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T/sw-launchd-test.G2ePKG/dashboard/server.ts — dashboard plist will reference a missing file
+[38;2;74;222;128m[1m✓[0m Created dashboard plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Created connect plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;0;212;255m[1m▸[0m Loading launchd services...
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Loaded daemon service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Loaded dashboard service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Loaded connect service
+
+[38;2;0;212;255m[1m▸[0m Services will auto-start on next login
+[38;2;0;212;255m[1m▸[0m View logs: [2mtail -f /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/.shipwright/logs/*.log[0m
+[38;2;0;212;255m[1m▸[0m Uninstall: [2mshipwright launchd uninstall[0m
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Dashboard plist has correct arguments... [38;2;0;212;255m[1m▸[0m Installing launchd agents...
+[38;2;74;222;128m[1m✓[0m Created daemon plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;250;204;21m[1m⚠[0m server.ts not found at /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T/sw-launchd-test.G2ePKG/dashboard/server.ts — dashboard plist will reference a missing file
+[38;2;74;222;128m[1m✓[0m Created dashboard plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Created connect plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;0;212;255m[1m▸[0m Loading launchd services...
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Loaded daemon service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Loaded dashboard service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Loaded connect service
+
+[38;2;0;212;255m[1m▸[0m Services will auto-start on next login
+[38;2;0;212;255m[1m▸[0m View logs: [2mtail -f /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/.shipwright/logs/*.log[0m
+[38;2;0;212;255m[1m▸[0m Uninstall: [2mshipwright launchd uninstall[0m
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Connect plist created only when team-config exists... [38;2;0;212;255m[1m▸[0m Installing launchd agents...
+[38;2;74;222;128m[1m✓[0m Created daemon plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/fresh-home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;250;204;21m[1m⚠[0m server.ts not found at /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T/sw-launchd-test.G2ePKG/dashboard/server.ts — dashboard plist will reference a missing file
+[38;2;74;222;128m[1m✓[0m Created dashboard plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/fresh-home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;0;212;255m[1m▸[0m Skipping connect plist — /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/fresh-home/.shipwright/team-config.json not found
+[38;2;0;212;255m[1m▸[0m Loading launchd services...
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/fresh-home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Loaded daemon service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/fresh-home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Loaded dashboard service
+
+[38;2;0;212;255m[1m▸[0m Services will auto-start on next login
+[38;2;0;212;255m[1m▸[0m View logs: [2mtail -f /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/fresh-home/.shipwright/logs/*.log[0m
+[38;2;0;212;255m[1m▸[0m Uninstall: [2mshipwright launchd uninstall[0m
+[38;2;0;212;255m[1m▸[0m Installing launchd agents...
+[38;2;74;222;128m[1m✓[0m Created daemon plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/fresh-home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;250;204;21m[1m⚠[0m server.ts not found at /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T/sw-launchd-test.G2ePKG/dashboard/server.ts — dashboard plist will reference a missing file
+[38;2;74;222;128m[1m✓[0m Created dashboard plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/fresh-home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Created connect plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/fresh-home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;0;212;255m[1m▸[0m Loading launchd services...
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/fresh-home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Loaded daemon service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/fresh-home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Loaded dashboard service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/fresh-home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Loaded connect service
+
+[38;2;0;212;255m[1m▸[0m Services will auto-start on next login
+[38;2;0;212;255m[1m▸[0m View logs: [2mtail -f /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/fresh-home/.shipwright/logs/*.log[0m
+[38;2;0;212;255m[1m▸[0m Uninstall: [2mshipwright launchd uninstall[0m
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Plist files have correct permissions... [38;2;0;212;255m[1m▸[0m Installing launchd agents...
+[38;2;74;222;128m[1m✓[0m Created daemon plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;250;204;21m[1m⚠[0m server.ts not found at /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T/sw-launchd-test.G2ePKG/dashboard/server.ts — dashboard plist will reference a missing file
+[38;2;74;222;128m[1m✓[0m Created dashboard plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Created connect plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;0;212;255m[1m▸[0m Loading launchd services...
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Loaded daemon service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Loaded dashboard service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Loaded connect service
+
+[38;2;0;212;255m[1m▸[0m Services will auto-start on next login
+[38;2;0;212;255m[1m▸[0m View logs: [2mtail -f /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/.shipwright/logs/*.log[0m
+[38;2;0;212;255m[1m▸[0m Uninstall: [2mshipwright launchd uninstall[0m
+[38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mInstall Command[0m
+  [38;2;0;212;255m▸[0m Install creates LaunchAgents directory... [38;2;0;212;255m[1m▸[0m Installing launchd agents...
+[38;2;74;222;128m[1m✓[0m Created daemon plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;250;204;21m[1m⚠[0m server.ts not found at /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T/sw-launchd-test.G2ePKG/dashboard/server.ts — dashboard plist will reference a missing file
+[38;2;74;222;128m[1m✓[0m Created dashboard plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Created connect plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;0;212;255m[1m▸[0m Loading launchd services...
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Loaded daemon service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Loaded dashboard service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Loaded connect service
+
+[38;2;0;212;255m[1m▸[0m Services will auto-start on next login
+[38;2;0;212;255m[1m▸[0m View logs: [2mtail -f /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/.shipwright/logs/*.log[0m
+[38;2;0;212;255m[1m▸[0m Uninstall: [2mshipwright launchd uninstall[0m
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Install calls launchctl load... [38;2;0;212;255m[1m▸[0m Installing launchd agents...
+[38;2;74;222;128m[1m✓[0m Created daemon plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;250;204;21m[1m⚠[0m server.ts not found at /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T/sw-launchd-test.G2ePKG/dashboard/server.ts — dashboard plist will reference a missing file
+[38;2;74;222;128m[1m✓[0m Created dashboard plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Created connect plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;0;212;255m[1m▸[0m Loading launchd services...
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Loaded daemon service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Loaded dashboard service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Loaded connect service
+
+[38;2;0;212;255m[1m▸[0m Services will auto-start on next login
+[38;2;0;212;255m[1m▸[0m View logs: [2mtail -f /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/.shipwright/logs/*.log[0m
+[38;2;0;212;255m[1m▸[0m Uninstall: [2mshipwright launchd uninstall[0m
+scripts/sw-launchd-test.sh: line 457: [[: 0
+0: syntax error in expression (error token is "0")
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Install fails gracefully if sw binary not found... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mUninstall Command[0m
+  [38;2;0;212;255m▸[0m Uninstall removes plist files... [38;2;0;212;255m[1m▸[0m Installing launchd agents...
+[38;2;74;222;128m[1m✓[0m Created daemon plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;250;204;21m[1m⚠[0m server.ts not found at /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T/sw-launchd-test.G2ePKG/dashboard/server.ts — dashboard plist will reference a missing file
+[38;2;74;222;128m[1m✓[0m Created dashboard plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Created connect plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;0;212;255m[1m▸[0m Loading launchd services...
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Loaded daemon service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Loaded dashboard service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Loaded connect service
+
+[38;2;0;212;255m[1m▸[0m Services will auto-start on next login
+[38;2;0;212;255m[1m▸[0m View logs: [2mtail -f /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/.shipwright/logs/*.log[0m
+[38;2;0;212;255m[1m▸[0m Uninstall: [2mshipwright launchd uninstall[0m
+[38;2;0;212;255m[1m▸[0m Uninstalling launchd agents...
+Mock unloaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Unloaded daemon service
+[38;2;74;222;128m[1m✓[0m Removed daemon plist
+Mock unloaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Unloaded dashboard service
+[38;2;74;222;128m[1m✓[0m Removed dashboard plist
+Mock unloaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Unloaded connect service
+[38;2;74;222;128m[1m✓[0m Removed connect plist
+
+[38;2;74;222;128m[1m✓[0m Uninstalled all launchd agents
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Uninstall calls launchctl unload... [38;2;0;212;255m[1m▸[0m Installing launchd agents...
+[38;2;74;222;128m[1m✓[0m Created daemon plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;250;204;21m[1m⚠[0m server.ts not found at /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T/sw-launchd-test.G2ePKG/dashboard/server.ts — dashboard plist will reference a missing file
+[38;2;74;222;128m[1m✓[0m Created dashboard plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Created connect plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;0;212;255m[1m▸[0m Loading launchd services...
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Loaded daemon service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Loaded dashboard service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Loaded connect service
+
+[38;2;0;212;255m[1m▸[0m Services will auto-start on next login
+[38;2;0;212;255m[1m▸[0m View logs: [2mtail -f /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/.shipwright/logs/*.log[0m
+[38;2;0;212;255m[1m▸[0m Uninstall: [2mshipwright launchd uninstall[0m
+[38;2;0;212;255m[1m▸[0m Uninstalling launchd agents...
+Mock unloaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Unloaded daemon service
+[38;2;74;222;128m[1m✓[0m Removed daemon plist
+Mock unloaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Unloaded dashboard service
+[38;2;74;222;128m[1m✓[0m Removed dashboard plist
+Mock unloaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Unloaded connect service
+[38;2;74;222;128m[1m✓[0m Removed connect plist
+
+[38;2;74;222;128m[1m✓[0m Uninstalled all launchd agents
+scripts/sw-launchd-test.sh: line 549: [[: 0
+0: syntax error in expression (error token is "0")
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Uninstall on empty system doesn't error... [38;2;0;212;255m[1m▸[0m Uninstalling launchd agents...
+
+[38;2;74;222;128m[1m✓[0m Uninstalled all launchd agents
+[38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mStatus Command[0m
+  [38;2;0;212;255m▸[0m Status command checks launchctl list... [38;2;0;212;255m[1m▸[0m Installing launchd agents...
+[38;2;74;222;128m[1m✓[0m Created daemon plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;250;204;21m[1m⚠[0m server.ts not found at /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T/sw-launchd-test.G2ePKG/dashboard/server.ts — dashboard plist will reference a missing file
+[38;2;74;222;128m[1m✓[0m Created dashboard plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Created connect plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;0;212;255m[1m▸[0m Loading launchd services...
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Loaded daemon service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Loaded dashboard service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Loaded connect service
+
+[38;2;0;212;255m[1m▸[0m Services will auto-start on next login
+[38;2;0;212;255m[1m▸[0m View logs: [2mtail -f /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/.shipwright/logs/*.log[0m
+[38;2;0;212;255m[1m▸[0m Uninstall: [2mshipwright launchd uninstall[0m
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Status shows log directory... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mHelp Command[0m
+  [38;2;0;212;255m▸[0m Help command shows usage and examples... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Help is shown for unknown commands... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mEnvironment & Configuration[0m
+  [38;2;0;212;255m▸[0m Plist contains correct environment variables... [38;2;0;212;255m[1m▸[0m Installing launchd agents...
+[38;2;74;222;128m[1m✓[0m Created daemon plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;250;204;21m[1m⚠[0m server.ts not found at /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T/sw-launchd-test.G2ePKG/dashboard/server.ts — dashboard plist will reference a missing file
+[38;2;74;222;128m[1m✓[0m Created dashboard plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Created connect plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;0;212;255m[1m▸[0m Loading launchd services...
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Loaded daemon service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Loaded dashboard service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Loaded connect service
+
+[38;2;0;212;255m[1m▸[0m Services will auto-start on next login
+[38;2;0;212;255m[1m▸[0m View logs: [2mtail -f /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/.shipwright/logs/*.log[0m
+[38;2;0;212;255m[1m▸[0m Uninstall: [2mshipwright launchd uninstall[0m
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Working directory is set in plist... [38;2;0;212;255m[1m▸[0m Installing launchd agents...
+[38;2;74;222;128m[1m✓[0m Created daemon plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;250;204;21m[1m⚠[0m server.ts not found at /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T/sw-launchd-test.G2ePKG/dashboard/server.ts — dashboard plist will reference a missing file
+[38;2;74;222;128m[1m✓[0m Created dashboard plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Created connect plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;0;212;255m[1m▸[0m Loading launchd services...
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Loaded daemon service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Loaded dashboard service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Loaded connect service
+
+[38;2;0;212;255m[1m▸[0m Services will auto-start on next login
+[38;2;0;212;255m[1m▸[0m View logs: [2mtail -f /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/.shipwright/logs/*.log[0m
+[38;2;0;212;255m[1m▸[0m Uninstall: [2mshipwright launchd uninstall[0m
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Plist configures stdout and stderr logging... [38;2;0;212;255m[1m▸[0m Installing launchd agents...
+[38;2;74;222;128m[1m✓[0m Created daemon plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;250;204;21m[1m⚠[0m server.ts not found at /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T/sw-launchd-test.G2ePKG/dashboard/server.ts — dashboard plist will reference a missing file
+[38;2;74;222;128m[1m✓[0m Created dashboard plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Created connect plist: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;0;212;255m[1m▸[0m Loading launchd services...
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.daemon.plist
+[38;2;74;222;128m[1m✓[0m Loaded daemon service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.dashboard.plist
+[38;2;74;222;128m[1m✓[0m Loaded dashboard service
+Mock loaded: /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/Library/LaunchAgents/com.shipwright.connect.plist
+[38;2;74;222;128m[1m✓[0m Loaded connect service
+
+[38;2;0;212;255m[1m▸[0m Services will auto-start on next login
+[38;2;0;212;255m[1m▸[0m View logs: [2mtail -f /var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-launchd-test.G2ePKG/home/.shipwright/logs/*.log[0m
+[38;2;0;212;255m[1m▸[0m Uninstall: [2mshipwright launchd uninstall[0m
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Version variable is defined... [38;2;74;222;128m✓[0m
+
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[38;2;74;222;128m[1m  All 20 tests passed ✓[0m
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Linear Test Suite[0m
+[2m  ══════════════════════════════════════════[0m
+
+
+[1m  Script Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+  [38;2;74;222;128m✓[0m VERSION variable defined
+  [38;2;74;222;128m✓[0m VERSION is semver: 3.2.4
+
+[1m  Help Output[0m
+  [38;2;74;222;128m✓[0m help mentions USAGE
+  [38;2;74;222;128m✓[0m help mentions sync command
+  [38;2;74;222;128m✓[0m help mentions update command
+  [38;2;74;222;128m✓[0m help mentions status command
+  [38;2;74;222;128m✓[0m help mentions init command
+  [38;2;74;222;128m✓[0m help mentions LINEAR_API_KEY
+  [38;2;74;222;128m✓[0m --help works
+
+[1m  Error Handling[0m
+
+[38;2;0;212;255m[1mshipwright linear[0m — Linear ↔ GitHub Bidirectional Sync
+
+[1mUSAGE[0m
+  [38;2;0;212;255mshipwright linear[0m <command> [options]
+
+[1mCOMMANDS[0m
+  [38;2;0;212;255msync[0m [--dry-run]              Sync Linear Todo issues → GitHub
+  [38;2;0;212;255mupdate[0m <issue> <status>       Update linked Linear ticket status
+  [38;2;0;212;255mstatus[0m                        Show sync dashboard
+  [38;2;0;212;255minit[0m                          Configure Linear API key
+  [38;2;0;212;255mhelp[0m                          Show this help
+
+[1mSTATUS VALUES[0m
+  [38;2;0;212;255mstarted[0m     Pipeline spawned   → Linear: In Progress
+  [38;2;0;212;255mreview[0m      PR created         → Linear: In Review
+  [38;2;0;212;255mdone[0m        Pipeline complete   → Linear: Done
+  [38;2;0;212;255mfailed[0m      Pipeline failed     → Linear: adds failure comment
+
+[1mEXAMPLES[0m
+  [2mshipwright linear init[0m                    # Set up API key
+  [2mshipwright linear sync[0m                    # Sync Todo → GitHub
+  [2mshipwright linear sync --dry-run[0m          # Preview what would sync
+  [2mshipwright linear update 42 started[0m       # Mark as In Progress
+  [2mshipwright linear update 42 review[0m        # Mark as In Review
+  [2mshipwright linear update 42 done[0m          # Mark as Done
+  [2mshipwright linear status[0m                  # Show dashboard
+
+[1mENVIRONMENT[0m
+  [2mLINEAR_API_KEY[0m      API key (or use 'linear init' to save)
+  [2mLINEAR_TEAM_ID[0m      Override team ID
+  [2mLINEAR_PROJECT_ID[0m   Override project ID
+  [38;2;74;222;128m✓[0m unknown command exits non-zero
+  [38;2;74;222;128m✓[0m unknown command shows error
+
+[1m  Default Behavior[0m
+  [38;2;74;222;128m✓[0m no-arg defaults to help
+
+[1m  Configuration[0m
+  [38;2;74;222;128m✓[0m sync without API key shows error
+  [38;2;74;222;128m✓[0m update without API key shows error
+  [38;2;74;222;128m✓[0m status without API key shows error
+
+[1m  Config Loading[0m
+  [38;2;74;222;128m✓[0m sync with config proceeds
+
+[1m  Update Subcommand[0m
+  [38;2;74;222;128m✓[0m update without args shows usage
+
+[1m  Notify Integration[0m
+  [38;2;74;222;128m✓[0m notify subcommand executes without crash
+
+[1m  Atomic Writes[0m
+  [38;2;74;222;128m✓[0m init uses atomic write (tmp + mv)
+  [38;2;74;222;128m✓[0m config file gets restricted permissions
+
+[1m  GraphQL Helper[0m
+  [38;2;74;222;128m✓[0m linear_graphql helper defined
+  [38;2;74;222;128m✓[0m uses jq --arg for safe JSON escaping
+
+[1m  Event Emission[0m
+  [38;2;74;222;128m✓[0m emits linear events
+  [38;2;74;222;128m✓[0m uses EVENTS_FILE for event logging
+
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  shipwright logs test[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1mScript Safety[0m
+  [38;2;74;222;128m✓[0m set -euo pipefail present
+  [38;2;74;222;128m✓[0m ERR trap present
+
+[1mVersion[0m
+  [38;2;74;222;128m✓[0m VERSION variable defined
+
+[1mHelp Output[0m
+  [38;2;74;222;128m✓[0m help contains USAGE
+  [38;2;74;222;128m✓[0m help contains --pane option
+  [38;2;74;222;128m✓[0m help contains --follow option
+  [38;2;74;222;128m✓[0m help contains --grep option
+  [38;2;74;222;128m✓[0m help contains --capture option
+  [38;2;74;222;128m✓[0m help contains -f shorthand
+
+[1mHelp Exit Code[0m
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m -h exits 0
+
+[1mError Handling[0m
+  [38;2;74;222;128m✓[0m unknown option exits non-zero
+  [38;2;74;222;128m✓[0m unknown option error
+
+[1mList Logs[0m
+  [38;2;74;222;128m✓[0m list shows Agent Logs heading
+  [38;2;74;222;128m✓[0m list shows team directory
+
+[1mTeam Logs[0m
+  [38;2;74;222;128m✓[0m team logs shows team name
+  [38;2;74;222;128m✓[0m team logs lists log files
+  [38;2;74;222;128m✓[0m team logs shows builder log
+
+[1mGrep Search[0m
+  [38;2;74;222;128m✓[0m grep finds ERROR pattern
+  [38;2;74;222;128m✓[0m grep shows file context
+  [38;2;74;222;128m✓[0m grep shows no matches warning
+
+[1mPane Filter[0m
+  [38;2;74;222;128m✓[0m pane filter shows reviewer logs
+  [38;2;74;222;128m✓[0m nonexistent pane warns
+
+[1mCapture Command[0m
+  [38;2;74;222;128m✓[0m capture reports status
+
+[1mMissing Arguments[0m
+  [38;2;74;222;128m✓[0m missing --pane value exits non-zero
+  [38;2;74;222;128m✓[0m missing --pane shows error
+  [38;2;74;222;128m✓[0m missing --grep value exits non-zero
+  [38;2;74;222;128m✓[0m missing --grep shows error
+
+[1mIntelligence Integration[0m
+  [38;2;74;222;128m✓[0m intelligence_available function defined
+  [38;2;74;222;128m✓[0m semantic_rank_results function defined
+
+[1mScript Structure[0m
+  [38;2;74;222;128m✓[0m LOGS_DIR defined
+  [38;2;74;222;128m✓[0m capture_logs function defined
+  [38;2;74;222;128m✓[0m list_logs function defined
+  [38;2;74;222;128m✓[0m show_team_logs function defined
+
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Loop Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[2m  help / version[0m
+  [38;2;74;222;128m✓[0m --help exits 0
+  [38;2;74;222;128m✓[0m --help shows usage
+  [38;2;74;222;128m✓[0m --help shows options
+  [38;2;74;222;128m✓[0m --help mentions --max-iterations
+  [38;2;74;222;128m✓[0m --help mentions --test-cmd
+  [38;2;74;222;128m✓[0m --help mentions --model
+  [38;2;74;222;128m✓[0m --help mentions --agents
+  [38;2;74;222;128m✓[0m --help mentions --resume
+  [38;2;74;222;128m✓[0m VERSION variable defined in sw-loop.sh
+
+[2m  argument parsing[0m
+  [38;2;74;222;128m✓[0m No arguments exits non-zero
+
+[2m  script safety[0m
+  [38;2;74;222;128m✓[0m Uses set -euo pipefail
+  [38;2;74;222;128m✓[0m ERR trap is set
+  [38;2;74;222;128m✓[0m SIGHUP trap set for daemon resilience
+  [38;2;74;222;128m✓[0m CLAUDECODE env var is unset
+
+[2m  defaults[0m
+  [38;2;74;222;128m✓[0m Default MAX_ITERATIONS is 20
+  [38;2;74;222;128m✓[0m Default AGENTS is 1
+  [38;2;74;222;128m✓[0m Default MAX_RESTARTS is 0
+  [38;2;74;222;128m✓[0m Sources lib/compat.sh
+
+[2m  json output format[0m
+  [38;2;74;222;128m✓[0m build_claude_flags includes --output-format json
+[2m  effort level flag[0m
+  [38;2;74;222;128m✓[0m build_claude_flags supports --effort
+[2m  fallback model flag[0m
+  [38;2;74;222;128m✓[0m build_claude_flags supports --fallback-model
+  [38;2;74;222;128m✓[0m accumulate_loop_tokens parses JSON usage
+  [38;2;74;222;128m✓[0m LOOP_COST_MILLICENTS initialized
+  [38;2;74;222;128m✓[0m write_loop_tokens includes cost_usd
+  [38;2;74;222;128m✓[0m _extract_text_from_json helper defined
+  [38;2;74;222;128m✓[0m validate_claude_output helper defined
+  [38;2;74;222;128m✓[0m check_budget_gate helper defined
+  [38;2;74;222;128m✓[0m run_claude_iteration separates stdout from stderr
+
+[2m  json extraction robustness[0m
+  [38;2;74;222;128m✓[0m _extract_text_from_json handles empty file
+  [38;2;74;222;128m✓[0m _extract_text_from_json extracts .result from JSON
+  [38;2;74;222;128m✓[0m _extract_text_from_json passes through plain text
+
+[2m  default config from source[0m
+  [38;2;74;222;128m✓[0m Default MAX_ITERATIONS is 20 (from source)
+  [38;2;74;222;128m✓[0m Default AGENTS is 1 (from source)
+  [38;2;74;222;128m✓[0m Default MAX_RESTARTS is 0 (from source)
+
+[2m  json extraction edge cases[0m
+  [38;2;74;222;128m✓[0m _extract_text_from_json handles nested JSON objects
+  [38;2;74;222;128m✓[0m _extract_text_from_json handles binary garbage without crash
+
+[2m  script structure[0m
+  [38;2;74;222;128m✓[0m Script has circuit breaker logic
+  [38;2;74;222;128m✓[0m Script has stuckness detection
+  [38;2;74;222;128m✓[0m Script has test/quality gate functions
+  [38;2;74;222;128m✓[0m Help text defines --model and --agents flags
+  [38;2;74;222;128m✓[0m Help text defines --test-cmd and --resume flags
+[2m  help mentions --effort[0m
+  [38;2;74;222;128m✓[0m Help text defines --effort flag
+[2m  help mentions --fallback-model[0m
+  [38;2;74;222;128m✓[0m Help text defines --fallback-model flag
+
+[2m  loop behavior: LOOP_COMPLETE[0m
+  [38;2;74;222;128m✓[0m Loop detected completion signal
+
+[2m  loop behavior: iterations on test failure[0m
+  [38;2;74;222;128m✓[0m Loop runs multiple iterations when tests fail initially
+
+[2m  loop behavior: max iterations[0m
+  [38;2;74;222;128m✓[0m Loop stops at max iterations
+
+[2m  loop behavior: stuckness detection[0m
+  [38;2;74;222;128m✓[0m Loop stops at limit (stuckness test)
+
+[2m  loop behavior: budget gate[0m
+  [38;2;74;222;128m✓[0m Budget gate stops loop
+
+[2m  validate_claude_output[0m
+  [38;2;74;222;128m✓[0m validate_claude_output catches corrupt output
+
+[2m  loop behavior: progress tracking[0m
+  [38;2;74;222;128m✓[0m Loop tracks progress via git
+
+[2m  context efficiency metrics[0m
+  [38;2;74;222;128m✓[0m loop.context_efficiency event exists in run_claude_iteration
+  [38;2;74;222;128m✓[0m Context efficiency emits raw and trimmed char counts
+  [38;2;74;222;128m✓[0m Context efficiency emits trim_ratio and budget_utilization
+  [38;2;74;222;128m✓[0m raw_prompt_chars measured from pre-trim prompt
+
+[2m  multi-test gate[0m
+  [38;2;74;222;128m✓[0m ADDITIONAL_TEST_CMDS variable defined
+  [38;2;74;222;128m✓[0m --additional-test-cmds flag in arg parser
+  [38;2;74;222;128m✓[0m --help documents --additional-test-cmds
+  [38;2;74;222;128m✓[0m run_test_gate writes test-evidence JSON
+  [38;2;74;222;128m✓[0m run_audit_agent reads structured test evidence
+
+[2m  verification gap handler[0m
+  [38;2;74;222;128m✓[0m Verification gap detection present
+  [38;2;74;222;128m✓[0m Verification gap resolved event emitted
+  [38;2;74;222;128m✓[0m Verification gap confirmed event emitted
+  [38;2;74;222;128m✓[0m Verification gap can override audit result
+  [38;2;74;222;128m✓[0m Verification re-runs tests to dedicated log
+  [38;2;74;222;128m✓[0m Mid-build test file discovery integrated
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 65 tests passed[0m
+
+
+[38;2;168;85;247m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
+[38;2;168;85;247m[1m║  shipwright memory+cost test — Unit Tests for Memory & Cost      ║[0m
+[38;2;168;85;247m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
+
+[2mSetting up mock environment...[0m
+[38;2;74;222;128m✓[0m Environment ready: [2m/var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-memory-test.62S2eY[0m
+
+  [38;2;0;212;255m▸[0m Memory capture from pipeline state... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Memory inject returns context for each stage... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Failure capture stores patterns... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pattern detection identifies project type... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cross-repo vs per-repo isolation... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Memory show displays dashboard... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Memory search finds matching entries... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Memory export produces valid JSON... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Memory forget clears repo memory... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cost calculation for each model... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cost recording writes to costs.json... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Budget set and check... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cost dashboard runs without errors... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cost JSON output is valid... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Actionable failures threshold filtering... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Actionable failures with no file returns []... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m DORA baseline calculation from events... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Error log entries captured into failures.json... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fix outcome tracking increments counters... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Closed-loop inject returns formatted fix... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Global aggregation promotes frequent patterns... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Finalize pipeline runs capture + aggregate... [38;2;0;212;255m[1m▸[0m Capturing pipeline learnings for [38;2;0;212;255mtest-org/test-repo[0m...
+[38;2;74;222;128m[1m✓[0m Captured pipeline learnings (status: complete)
+[38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1m━━━ Results ━━━[0m
+  [38;2;74;222;128mPassed:[0m 22
+  [38;2;248;113;113mFailed:[0m 0
+  [2mTotal:[0m  22
+
+[38;2;74;222;128m[1mAll 22 tests passed![0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Mission Control Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1m  Help & Navigation[0m
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows commands
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m unknown command shows error
+[1m  Overview[0m
+  [38;2;74;222;128m✓[0m overview shows MISSION CONTROL header
+  [38;2;74;222;128m✓[0m overview shows Summary Statistics
+  [38;2;74;222;128m✓[0m overview shows Active Pipelines
+  [38;2;74;222;128m✓[0m overview with active job shows count
+[1m  Agent Tree[0m
+  [38;2;74;222;128m✓[0m agents shows hierarchy
+  [38;2;74;222;128m✓[0m agents shows Pipeline Agent
+[1m  Resources[0m
+  [38;2;74;222;128m✓[0m resources shows utilization
+[1m  Alerts[0m
+  [38;2;74;222;128m✓[0m alerts shows alert feed
+[1m  Stage Commands[0m
+  [38;2;74;222;128m✓[0m pause without id exits nonzero
+  [38;2;74;222;128m✓[0m pause emits success
+  [38;2;74;222;128m✓[0m resume without id exits nonzero
+  [38;2;74;222;128m✓[0m resume emits success
+  [38;2;74;222;128m✓[0m skip without stage shows usage
+  [38;2;74;222;128m✓[0m skip emits success
+  [38;2;74;222;128m✓[0m retry emits success
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 19 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Model Router Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1m  Help & Version[0m
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows route
+  [38;2;74;222;128m✓[0m help shows escalate
+  [38;2;74;222;128m✓[0m help shows config
+
+[1m  Route Model[0m
+  [38;2;74;222;128m✓[0m route intake at 50 = haiku
+  [38;2;74;222;128m✓[0m route build at 50 = opus
+  [38;2;74;222;128m✓[0m route test at 50 = sonnet
+  [38;2;74;222;128m✓[0m route build at 10 (low) = sonnet
+  [38;2;74;222;128m✓[0m route intake at 90 (high) = opus
+  [38;2;74;222;128m✓[0m route unknown stage at 50 = sonnet
+
+[1m  Escalate Model[0m
+  [38;2;74;222;128m✓[0m escalate haiku -> sonnet
+  [38;2;74;222;128m✓[0m escalate sonnet -> opus
+  [38;2;74;222;128m✓[0m escalate opus -> opus (ceiling)
+  [38;2;74;222;128m✓[0m escalate unknown exits non-zero
+
+[1m  Config[0m
+  [38;2;74;222;128m✓[0m config show displays JSON
+  [38;2;74;222;128m✓[0m config creates default file
+  [38;2;74;222;128m✓[0m config set confirms update
+  [38;2;74;222;128m✓[0m config set persists value
+
+[1m  Estimate[0m
+  [38;2;74;222;128m✓[0m estimate shows stages
+  [38;2;74;222;128m✓[0m estimate shows total
+
+[1m  Report[0m
+  [38;2;74;222;128m✓[0m report with no data warns
+
+[1m  Record Usage[0m
+  [38;2;74;222;128m✓[0m record_usage creates usage file
+  [38;2;74;222;128m✓[0m record_usage writes entries
+  [38;2;74;222;128m✓[0m report with data shows summary
+  [38;2;74;222;128m✓[0m report shows total runs
+  [38;2;74;222;128m✓[0m report shows cost
+  [38;2;74;222;128m✓[0m report shows model counts
+
+[1m  Route All Stages & Complexity[0m
+  [38;2;74;222;128m✓[0m route intake at 50 returns model
+  [38;2;74;222;128m✓[0m route plan at 50 returns model
+  [38;2;74;222;128m✓[0m route design at 50 returns model
+  [38;2;74;222;128m✓[0m route build at 50 returns model
+  [38;2;74;222;128m✓[0m route test at 50 returns model
+  [38;2;74;222;128m✓[0m route review at 50 returns model
+  [38;2;74;222;128m✓[0m route compound_quality at 50 returns model
+  [38;2;74;222;128m✓[0m route validate at 50 returns model
+  [38;2;74;222;128m✓[0m route monitor at 50 returns model
+  [38;2;74;222;128m✓[0m route plan at low complexity = sonnet
+  [38;2;74;222;128m✓[0m route plan at high complexity = opus
+
+[1m  Config Set/Show Cycle[0m
+[38;2;74;222;128m[1m✓[0m Updated cost_aware_mode = false
+  [38;2;74;222;128m✓[0m config show reflects settings
+  [38;2;74;222;128m✓[0m config set persists
+  [38;2;74;222;128m✓[0m estimate with low complexity shows stages
+  [38;2;74;222;128m✓[0m estimate shows Total
+  [38;2;74;222;128m✓[0m estimate with high complexity
+
+[1m  Error Handling[0m
+  [38;2;74;222;128m✓[0m unknown subcommand exits non-zero
+  [38;2;74;222;128m✓[0m unknown subcommand shows error
+
+[1m  Reasoning Chains[0m
+  [38;2;74;222;128m✓[0m chain config shows templates
+  [38;2;74;222;128m✓[0m chain config shows explore-synthesize-decide
+  [38;2;74;222;128m✓[0m chain config shows fast-verify
+  [38;2;74;222;128m✓[0m chain config shows deep-analysis
+  [38;2;74;222;128m✓[0m chain config creates templates file
+  [38;2;74;222;128m✓[0m chain define shows success
+  [38;2;74;222;128m✓[0m chain define persists custom chain
+  ✓ chain_score_confidence returns numeric score
+  ✓ chain_score_confidence scores conclusion text higher
+  ✓ chain execute returns valid JSON
+  ✓ chain execute result has steps
+  ✓ chain step-cost returns numeric cost for haiku
+  ✓ chain step-cost ordering correct (haiku < sonnet < opus)
+  ✓ chain report outputs summary
+  ✓ chain define with invalid JSON exits non-zero
+  ✓ chain define validates JSON
+  ✓ explore-decide has 2 steps
+  ✓ explore-decide first step is haiku
+  ✓ explore-decide last step is opus
+  ✓ chain execute with invalid chain exits non-zero
+  ✓ chain execute shows error
+
+
+
+  ──────────────────────────────────────────
+
+  All 66 tests passed
+
+
+
+[38;2;0;212;255m[1m  Shipwright OTel Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+[1m  Help & Version[0m
+  [38;2;74;222;128m✓[0m help shows usage
+  [38;2;74;222;128m✓[0m help shows metrics
+  [38;2;74;222;128m✓[0m help shows trace
+  [38;2;74;222;128m✓[0m help shows export
+  [38;2;74;222;128m✓[0m help shows webhook
+  [38;2;74;222;128m✓[0m help shows dashboard
+
+[1m  Metrics[0m
+  [38;2;74;222;128m✓[0m metrics text has pipelines_total
+  [38;2;74;222;128m✓[0m metrics text has active_pipelines
+  [38;2;74;222;128m✓[0m metrics text has cost
+  [38;2;74;222;128m✓[0m metrics text has queue depth
+  [38;2;74;222;128m✓[0m metrics json has metrics key
+  [38;2;74;222;128m✓[0m metrics json has pipelines_total
+  [38;2;74;222;128m✓[0m metrics json is valid JSON
+
+[1m  Trace[0m
+  [38;2;74;222;128m✓[0m trace has resourceSpans
+  [38;2;74;222;128m✓[0m trace has service.name
+  [38;2;74;222;128m✓[0m trace output is valid JSON
+
+[1m  Dashboard[0m
+  [38;2;74;222;128m✓[0m dashboard has dashboard key
+  [38;2;74;222;128m✓[0m dashboard output is valid JSON
+
+[1m  Report[0m
+  [38;2;74;222;128m✓[0m report shows header
+  [38;2;74;222;128m✓[0m report shows events section
+  [38;2;74;222;128m✓[0m report shows pipeline metrics
+  [38;2;74;222;128m✓[0m report shows recommendations
+
+[1m  Webhook[0m
+  [38;2;74;222;128m✓[0m webhook without URL exits non-zero
+  [38;2;74;222;128m✓[0m webhook without URL shows error
+
+[1m  Metrics With Events[0m
+  [38;2;74;222;128m✓[0m metrics count total pipelines = 2
+
+[1m  Error Handling[0m
+  [38;2;74;222;128m✓[0m unknown command exits non-zero
+  [38;2;74;222;128m✓[0m unknown command shows error
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 27 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Oversight Tests[0m
+[2m  ══════════════════════════════════════════[0m
+
+[2m  ══════════════════════════════════════════[0m
+
+  [38;2;74;222;128m✓[0m help shows usage text
+  [38;2;74;222;128m✓[0m help exits 0
+  [38;2;74;222;128m✓[0m --help flag works
+  [38;2;74;222;128m✓[0m unknown command exits 1
+  [38;2;74;222;128m✓[0m members shows board
+  [38;2;74;222;128m✓[0m members.json created
+  [38;2;74;222;128m✓[0m members.json is valid JSON
+  [38;2;74;222;128m✓[0m config show works
+  [38;2;74;222;128m✓[0m config.json created
+  [38;2;74;222;128m✓[0m stats shows statistics
+  [38;2;74;222;128m✓[0m history handles empty
+  [38;2;74;222;128m✓[0m review without args exits nonzero
+  [38;2;74;222;128m✓[0m review submission accepted
+  [38;2;74;222;128m✓[0m review JSON file created
+  [38;2;74;222;128m✓[0m review file is valid JSON
+  [38;2;74;222;128m✓[0m stats shows total reviews >= 1
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+
+[38;2;0;212;255m[1m  Shipwright Patrol Meta Test Suite[0m
+[2m  ══════════════════════════════════════════[0m
+
+
+[1m  Script Structure[0m
+  [38;2;74;222;128m✓[0m contains sourced-file note
+  [38;2;74;222;128m✓[0m does NOT have set -euo pipefail as code (sourced script)
+  [38;2;74;222;128m✓[0m no main() function (sourced script)
+
+[1m  Function Definitions[0m
+  [38;2;74;222;128m✓[0m patrol_meta_run() defined
+  [38;2;74;222;128m✓[0m patrol_meta_create_issue() defined
+  [38;2;74;222;128m✓[0m patrol_meta_untested_scripts() defined
+  [38;2;74;222;128m✓[0m patrol_meta_bash_compat() defined
+  [38;2;74;222;128m✓[0m patrol_meta_version_sync() defined
+  [38;2;74;222;128m✓[0m patrol_meta_dora_trends() defined
+  [38;2;74;222;128m✓[0m patrol_meta_template_effectiveness() defined
+  [38;2;74;222;128m✓[0m patrol_meta_memory_pruning() defined
+  [38;2;74;222;128m✓[0m patrol_meta_event_analysis() defined
+
+[1m  Sourcing[0m
+  [38;2;74;222;128m✓[0m script can be sourced without error
+
+[1m  NO_GITHUB Dry Run[0m
+  [38;2;74;222;128m✓[0m checks NO_GITHUB for dry-run mode
+  [38;2;74;222;128m✓[0m supports dry-run output
+
+[1m  Bash Compat Checks[0m
+  [38;2;74;222;128m✓[0m bash compat check looks for declare -A
+  [38;2;74;222;128m✓[0m bash compat check looks for readarray/mapfile
+
+[1m  Dedup Logic[0m
+  [38;2;74;222;128m✓[0m dedup logic skips duplicate issues
+  [38;2;74;222;128m✓[0m dedup searches existing issues
+
+[1m  Memory Pruning Check[0m
+  [38;2;74;222;128m✓[0m memory pruning uses du -sk for size check
+  [38;2;74;222;128m✓[0m memory pruning has MB threshold
+
+[1m  Event Analysis[0m
+  [38;2;74;222;128m✓[0m event analysis uses 7-day window
+  [38;2;74;222;128m✓[0m event analysis checks pipeline.completed events
+
+[1m  Closed-Loop Self-Improvement Functions[0m
+  [38;2;74;222;128m✓[0m patrol_meta_score_impact() defined
+  [38;2;74;222;128m✓[0m patrol_meta_execute_fix() defined
+  [38;2;74;222;128m✓[0m patrol_meta_verify_fix() defined
+  [38;2;74;222;128m✓[0m patrol_meta_rollback() defined
+  [38;2;74;222;128m✓[0m patrol_meta_learn() defined
+  [38;2;74;222;128m✓[0m patrol_meta_batch_improve() defined
+  [38;2;74;222;128m✓[0m patrol_meta_auto() defined
+
+[1m  Impact Scoring[0m
+  [38;2;74;222;128m✓[0m untested-scripts category gets high score (75)
+  [38;2;74;222;128m✓[0m dora-regression category gets critical score (85)
+
+[1m  Pipeline Integration[0m
+  [38;2;74;222;128m✓[0m execute_fix calls shipwright pipeline start
+  [38;2;74;222;128m✓[0m uses --worktree for isolated execution
+
+[1m  Learning & Memory[0m
+  [38;2;74;222;128m✓[0m records self-improvements in memory
+  [38;2;74;222;128m✓[0m emits patrol.meta_learned events
+
+[1m  Batch Processing[0m
+  [38;2;74;222;128m✓[0m batch_improve looks for meta-improvement labeled issues
+  [38;2;74;222;128m✓[0m sorts issues by impact score (highest first)
+
+[1m  Dry-Run Mode[0m
+  [38;2;74;222;128m✓[0m new functions respect NO_GITHUB for dry-run
+
+[1m  Autonomous Loop[0m
+  [38;2;74;222;128m✓[0m patrol_meta_auto() orchestrates full loop
+  [38;2;74;222;128m✓[0m auto loop has stage 1 (detection) and stage 2 (batch)
+
+
+
+
+[2m  ──────────────────────────────────────────[0m
+
+  [38;2;74;222;128m[1mAll 0 tests passed[0m
+
+
+[38;2;0;212;255m[1m╔═══════════════════════════════════════════════════╗[0m
+[38;2;0;212;255m[1m║  shipwright pipeline composer — Test Suite        ║[0m
+[38;2;0;212;255m[1m╚═══════════════════════════════════════════════════╝[0m
+
+[2mSetting up test environment...[0m
+
+[38;2;168;85;247m[1mPipeline Composition[0m
+  [38;2;0;212;255m▸[0m Composed pipeline has valid stage ordering... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m High-risk issue gets security stages... .claude/pipeline-artifacts/composed-pipeline.json
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Fallback to static template when no intelligence... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mConditional Stage Insertion[0m
+  [38;2;0;212;255m▸[0m Stage inserted at correct position after build... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Insert into nonexistent stage fails... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mModel Downgrade[0m
+  [38;2;0;212;255m▸[0m Budget constraint triggers model downgrades... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Downgrade with nonexistent stage fails... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mPipeline Validation[0m
+  [38;2;0;212;255m▸[0m Validation accepts valid pipeline... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Validation rejects invalid ordering (test before build)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Validation rejects missing stage ids... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Validation rejects missing stages array... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1mIteration Estimation[0m
+  [38;2;0;212;255m▸[0m Iteration estimates are reasonable (1-50 range)... [38;2;74;222;128m✓[0m
+
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+[38;2;74;222;128m[1m  All 12 tests passed ✓[0m
+[38;2;0;212;255m[1m════════════════════════════════════════════════════[0m
+
+
+[38;2;168;85;247m[1m╔═══════════════════════════════════════════════════════════════════╗[0m
+[38;2;168;85;247m[1m║  shipwright pipeline test — E2E Validation (Real Subprocess)     ║[0m
+[38;2;168;85;247m[1m╚═══════════════════════════════════════════════════════════════════╝[0m
+
+[2mSetting up mock environment...[0m
+[38;2;74;222;128m✓[0m Environment ready: [2m/var/folders/57/0gs_mdl104q8vk054nz3wp3h0000gn/T//sw-pipeline-test.gCxJon[0m
+
+  [38;2;0;212;255m▸[0m Preflight passes with all mocks... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Preflight fails when sw-loop.sh missing... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Start requires --goal or --issue... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intake with --goal creates branch + artifacts... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intake with --issue fetches from GitHub... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Plan generates plan.md, dod.md, tasks...     [38;2;248;113;113m✗[0m File not found: .claude/pipeline-artifacts/plan.md (plan generated)
+[38;2;248;113;113m✗ FAILED[0m
+  [38;2;0;212;255m▸[0m Build invokes sw loop and commits... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Test stage captures results to log... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Review generates report with severities...     [38;2;248;113;113m✗[0m File not found: .claude/pipeline-artifacts/review.md (review generated)
+[38;2;248;113;113m✗ FAILED[0m
+  [38;2;0;212;255m▸[0m PR stage creates PR URL artifact... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Full E2E pipeline (6 stages)...     [38;2;248;113;113m✗[0m File not found: .claude/pipeline-artifacts/plan.md (plan artifact)
+[38;2;248;113;113m✗ FAILED[0m
+  [38;2;0;212;255m▸[0m Resume continues from partial state...     [38;2;248;113;113m✗[0m File not found: .claude/pipeline-artifacts/plan.md (plan generated after resume)
+[38;2;248;113;113m✗ FAILED[0m
+  [38;2;0;212;255m▸[0m Abort marks pipeline as aborted... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Dry run shows config, no artifacts...     [38;2;248;113;113m✗[0m Output missing pattern: Pipeline.*standard (shows pipeline name)
+    [2mOutput (last 5 lines):[0m
+        [1mEstimated Cost:[0m         $0.5040 USD
+      
+      [38;2;74;222;128m[1m✓[0m Dry run validation passed
+      
+        To execute this pipeline: [2mremove --dry-run flag[0m
+[38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Self-healing build→test retry loop... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: Skip stages for documentation issues... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: Skip stages for low complexity...     [38;2;248;113;113m✗[0m Output missing pattern: intelligence.*complexity.*[0-3]|stage.*skipped (should show intelligence skip due to complexity)
+    [2mOutput (last 5 lines):[0m
+      [38;2;0;212;255m[1m▸[0m RL episode recorded (success=true, iterations=1)
+      {"timestamp":"2026-04-04T12:55:26Z","epoch":1775307326,"pipeline_id":"fast","reward":0.4950,"components":{"test_outcome":0.5,"iteration_efficiency":0.5,"cost_efficiency":0.8,"quality_score":0.5,"convergence_speed":0.0000,"memory_hit_rate":0.5},"context":{"language":"unknown","complexity":"2"}}
+      [38;2;74;222;128m[1m✓[0m Learned policy from 17 episodes across 3 context buckets
+      jq: parse error: Invalid numeric literal at line 1, column 2
+      jq: parse error: Invalid numeric literal at line 1, column 2
+[38;2;248;113;113m✗ FAILED[0m
+  [38;2;0;212;255m▸[0m Intelligence: Finding classification and routing... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: Mid-pipeline complexity reassessment... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Intelligence: Backtracking limit (1 per pipeline)... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Cleanup: Post-completion clears checkpoints and transient artifacts...     [38;2;248;113;113m✗[0m Expected exit code 0, got 1 (pipeline should complete)
+[38;2;248;113;113m✗ FAILED[0m
+  [38;2;0;212;255m▸[0m Cleanup: pipeline_cancel_check_runs function exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals: sw-pipeline-vitals.sh exists and is syntactically valid... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals: All vitals functions defined in module... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals: Health verdict maps scores correctly... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals: Adaptive limit returns valid integer... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals: Budget trajectory returns ok/warn/stop... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Quality: pipeline_select_audits function exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Quality: pipeline_security_source_scan function exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Quality: pipeline_verify_dod function exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Quality: pipeline_record_quality_score function exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Quality: Templates have compound_quality_blocking... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals: Progress snapshot writes correct file... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals: Momentum score from snapshot history... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals: Convergence with decreasing errors... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals: Configurable weights via env vars... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals: Budget trajectory warn/stop on exhaustion... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Quality: Structured findings JSON is valid... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Quality: Multi-backtrack counter tracking... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Quality: 6 categories in classify_quality_findings... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Deploy: Pre-deploy gates exist in pipeline... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Deploy: Deploy strategy config pattern... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Deploy: Canary deploy flow patterns exist... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: PIPELINE_STATE references removed... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: Coverage JSON creation in test stage... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: _pipeline_compact_goal returns goal+plan+design... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Pipeline: load_composed_pipeline sets COMPOSED_STAGES... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals: Momentum returns 60 for single snapshot past intake... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals: Health gate blocks when health < threshold... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Vitals: Health gate passes with default threshold=40... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Durable: persist_artifacts function exists... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Durable: persist_artifacts skips in non-CI mode... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Durable: verify_stage_artifacts passes when artifacts present... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Durable: verify_stage_artifacts fails when artifacts missing... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Durable: verify_stage_artifacts fails when artifacts empty... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Durable: verify_stage_artifacts passes for stages with no requirements... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Durable: verify_stage_artifacts design requires plan.md... [38;2;74;222;128m✓[0m
+  [38;2;0;212;255m▸[0m Durable: mark_stage_complete wires persist for plan stage... [38;2;74;222;128m✓[0m
+
+[38;2;168;85;247m[1m━━━ Results ━━━[0m
+  [38;2;74;222;128mPassed:[0m 52
+  [38;2;248;113;113mFailed:[0m 6
+  [2mTotal:[0m  58
+
+[38;2;248;113;113m[1mFailed tests:[0m
+  [38;2;248;113;113m✗[0m Plan generates plan.md, dod.md, tasks
+  [38;2;248;113;113m✗[0m Review generates report with severities
+  [38;2;248;113;113m✗[0m Full E2E pipeline (6 stages)
+  [38;2;248;113;113m✗[0m Resume continues from partial state
+  [38;2;248;113;113m✗[0m Intelligence: Skip stages for low complexity
+  [38;2;248;113;113m✗[0m Cleanup: Post-completion clears checkpoints and transient artifacts
+
diff --git a/.claude/loop-state.md b/.claude/loop-state.md
index 0362dc9e6..e1c4fe7b5 100644
--- a/.claude/loop-state.md
+++ b/.claude/loop-state.md
@@ -1,104 +1,79 @@
 ---
-goal: "Add a shipwright ping command that prints pong to stdout and exits 0
+goal: "Add version display to sw-hello command: read version from package.json, display Shipwright vX.Y.Z, add test
 
-## Plan Summary
-Plan complete and saved to `docs/plans/2026-03-02-ping-command.md`.
+## Specification: Add version display to sw-hello command: read version from package.json, display Shipwright vX.Y.Z, add test
 
----
-
-## Summary
-
-The plan adds the `shipwright ping` command in **4 files, 9 tasks**:
-
-| # | Task | File(s) |
-|---|------|---------|
-| 1-2 | Create + chmod `sw-ping.sh` | `scripts/sw-ping.sh` (new) |
-| 3-4 | Create + chmod `sw-ping-test.sh` | `scripts/sw-ping-test.sh` (new) |
-| 5 | Run test in isolation — verify 6 PASS | — |
-| 6 | Register `ping)` case in router | `scripts/sw` |
-| 7 | Add test to `npm test` chain | `package.json` |
-| 8 | Smoke-test via router | — |
-| 9 | Commit | — |
+### Goals
+- Add version display to sw-hello command: read version from package.json, display Shipwright vX.Y.Z, add test
 
-**Key decisions:**
-- **Standalone script** (not inline in router) — only approach consistent with all 100+ existing commands, independently testable
-[... full plan in .claude/pipeline-artifacts/plan.md]
-
-## Key Design Decisions
-# Design: Add a shipwright ping command that prints pong to stdout and exits 0
-## Context
-## Component Diagram
-## Decision
-## Interface Contracts
-# sw-ping.sh — Public interface
-# Invocation (no args): happy path
-# stdout: "pong\n"
-# stderr: (empty)
-# exit:   0
-[... full design in .claude/pipeline-artifacts/design.md]
+### Acceptance Criteria
+- [testable] All existing tests continue to pass
 
 Historical context (lessons from previous pipelines):
 {
   "results": [
     {
-      "file": "architecture.json",
-      "relevance": 95,
-      "summary": "Describes Command Router pattern, bash 3.2 conventions (set -euo pipefail, VERSION at top), snake_case function naming, and test harness structure — exactly what's needed to implement the ping command correctly"
-    },
-    {
-      "file": "failures.json (comprehensive with 8 entries)",
+      "file": "patterns.json",
       "relevance": 85,
-      "summary": "Shows critical historical failures including 'output missing: intake' (23 occurrences, highest weight 7.8e+47), shell-init errors, and test infrastructure issues — directly relevant to avoiding similar failures in build stage"
+      "summary": "Defines project conventions: vitest test runner, npm package manager, test_pattern *.test.js, source_dir src/, commonjs imports — directly relevant for writing new tests for the version display feature"
     },
     {
-      "file": "metrics.json (build_duration_s: 2826)",
+      "file": "metrics.json",
       "relevance": 55,
-      "summary": "Previous build took 47 minutes — provides performance baseline and expectation setting for current build duration"
+      "summary": "Recent baseline metrics (2026-03-09) showing build_duration_s: 17827, test_duration_s: 1575 — provides performance context for the build stage and typical test execution time"
     },
     {
-      "file": "failures.json (shell-init: error retrieving current directory)",
-      "relevance": 50,
-      "summary": "Test stage failure in getcwd — indicates potential sandbox/environment issues that could affect ping command testing"
+      "file": "patterns.json",
+      "relevance": 40,
+      "summary": "Simpler project type confirmation (nodejs, detected 2026-02-21) — validates project classification but less actionable than the conventions entry above"
     },
     {
-      "file": "patterns.json (import_style: commonjs)",
+      "file": "metrics.json",
       "relevance": 30,
-      "summary": "Indicates JavaScript/Node.js project context; mostly empty but shows partial project type detection from previous runs"
+      "summary": "Older baseline (2026-02-21) with build_duration_s: 147, test_duration_s: 1 — historical reference point, less relevant than recent metrics"
+    },
+    {
+      "file": "failures.json",
+      "relevance": 10,
+      "summary": "Pipeline and mock binary test failures from Shipwright itself — not relevant to sw-hello version display feature implementation"
     }
   ]
 }
 
 Discoveries from other pipelines:
-[38;2;74;222;128m[1m✓[0m Injected 1 new discoveries
-[design] Design completed for Add a shipwright ping command that prints pong to stdout and exits 0 — Resolution: 
-
-## Failure Diagnosis (Iteration 2)
-Classification: unknown
-Strategy: retry_with_context
-Repeat count: 0
-
-## Failure Diagnosis (Iteration 3)
-Classification: unknown
-Strategy: retry_with_context
-Repeat count: 1
-
-## Failure Diagnosis (Iteration 4)
-Classification: unknown
-Strategy: retry_with_context
-Repeat count: 0"
-iteration: 4
-max_iterations: 20
-status: error
+[38;2;74;222;128m[1m✓[0m Injected 126 new discoveries
+[intake] Stage intake completed — Resolution: 
+[intake] Stage intake completed — Resolution: 
+[intake] Stage intake completed — Resolution: 
+[compound_quality] Stage compound_quality completed — Resolution: 
+[intake] Stage intake completed — Resolution: 
+[pr] Stage pr completed — Resolution: 
+[pipeline_success] Pipeline success for issue #0 (fast template, stage=validate) — Resolution: success
+[intake] Stage intake completed — Resolution: 
+[pr] Stage pr completed — Resolution: 
+[intake] Stage intake completed — Resolution: 
+[compound_quality] Stage compound_quality completed — Resolution: 
+[pr] Stage pr completed — Resolution: 
+[intake] Stage intake completed — Resolution: 
+[compound_quality] Stage compound_quality completed — Resolution: 
+[pr] Stage pr completed — Resolution: 
+[intake] Stage intake completed — Resolution: 
+[design] Design completed for Build a production-grade todo application. TypeScript + React frontend with Vite, Express REST API backend, SQLite persistence with Drizzle ORM, JWT authentication (register/login), full CRUD for todos with filtering (all/active/completed), drag-and-drop reorder, due dates, priorities (low/medium/high), dark mode, responsive design. Include comprehensive test suite (unit + integration + e2e). Production-ready: error handling, input validation, rate limiting, CORS, environment config. — Resolution: 
+[intake] Stage intake completed — Resolution: 
+[intake] Stage intake completed — Resolution: "
+iteration: 1
+max_iterations: 10
+status: running
 test_cmd: "npm test"
 model: sonnet
 agents: 1
-started_at: 2026-03-02T08:27:01Z
-last_iteration_at: 2026-03-02T08:27:01Z
-consecutive_failures: 1
-total_commits: 3
-audit_enabled: true
-audit_agent_enabled: true
-quality_gates_enabled: true
+started_at: 2026-04-04T12:34:56Z
+last_iteration_at: 2026-04-04T12:34:56Z
+consecutive_failures: 0
+total_commits: 1
+audit_enabled: false
+audit_agent_enabled: false
+quality_gates_enabled: false
 dod_file: ""
 auto_extend: true
 extension_count: 0
@@ -106,14 +81,6 @@ max_extensions: 3
 ---
 
 ## Log
-### Iteration 1 (2026-03-02T08:06:08Z)
-This is also a task notification for a background command that was already retrieved and reviewed via `TaskOutput` in th
-No new information — the ping command implementation is complete and `LOOP_COMPLETE` was already declared.
-
-### Iteration 2 (2026-03-02T08:25:28Z)
-The background task already completed and was retrieved in my previous turn — `npm test` exited with code 0. The ping co
-LOOP_COMPLETE
-
-### Iteration 3 (2026-03-02T08:26:58Z)
-(no output)
+### Iteration 1 (2026-04-04T12:34:56Z)
+{"type":"result","subtype":"success","is_error":false,"duration_ms":90646,"duration_api_ms":90727,"num_turns":13,"result
 
diff --git a/.claude/platform-hygiene.json b/.claude/platform-hygiene.json
index 9338cc285..43a34aaca 100644
--- a/.claude/platform-hygiene.json
+++ b/.claude/platform-hygiene.json
@@ -1,12 +1,12 @@
 {
-  "timestamp": "2026-03-10T15:34:26Z",
-  "repository": "shipwright",
+  "timestamp": "2026-04-04T12:42:58Z",
+  "repository": "hello-v3",
   "counts": {
-    "hardcoded": 46,
-    "fallback": 68,
-    "todo": 45,
-    "fixme": 23,
-    "hack": 18
+    "hardcoded": 48,
+    "fallback": 67,
+    "todo": 51,
+    "fixme": 25,
+    "hack": 20
   },
   "findings_sample": [
     {
@@ -298,9 +298,21 @@
       "line": 454
     },
     {
-      "file": "scripts/lib/adaptive-timeout.sh",
+      "file": "scripts/lib/process-reward.sh",
       "line": 459
     },
+    {
+      "file": "scripts/lib/process-reward.sh",
+      "line": 115
+    },
+    {
+      "file": "scripts/lib/process-reward.sh",
+      "line": 117
+    },
+    {
+      "file": "scripts/lib/adaptive-timeout.sh",
+      "line": 261
+    },
     {
       "file": "scripts/lib/pipeline-detection.sh",
       "line": 214
@@ -325,13 +337,9 @@
       "file": "scripts/lib/pipeline-intelligence-compound.sh",
       "line": 241
     },
-    {
-      "file": "scripts/lib/loop-convergence.sh",
-      "line": 242
-    },
     {
       "file": "scripts/lib/test-optimizer.sh",
-      "line": 85
+      "line": 242
     },
     {
       "file": "scripts/lib/pipeline-execution.sh",
@@ -395,7 +403,7 @@
     },
     {
       "file": "scripts/lib/pipeline-stages-build.sh",
-      "line": 1008
+      "line": 1041
     },
     {
       "file": "scripts/lib/convergence.sh",
@@ -403,7 +411,7 @@
     },
     {
       "file": "scripts/lib/pipeline-quality-gates.sh",
-      "line": 342
+      "line": 343
     },
     {
       "file": "scripts/lib/pipeline-quality-gates.sh",
@@ -451,7 +459,7 @@
     },
     {
       "file": "scripts/lib/compat.sh",
-      "line": 467
+      "line": 624
     },
     {
       "file": "scripts/lib/pipeline-quality-checks.sh",
@@ -471,7 +479,7 @@
     },
     {
       "file": "scripts/lib/pipeline-util.sh",
-      "line": 439
+      "line": 482
     },
     {
       "file": "scripts/sw-fix.sh",
@@ -547,31 +555,31 @@
     },
     {
       "file": "scripts/sw-loop.sh",
-      "line": 548
+      "line": 561
     },
     {
       "file": "scripts/sw-loop.sh",
-      "line": 1106
+      "line": 1119
     },
     {
       "file": "scripts/sw-loop.sh",
-      "line": 1182
+      "line": 1195
     },
     {
       "file": "scripts/sw-loop.sh",
-      "line": 1246
+      "line": 1259
     },
     {
       "file": "scripts/sw-loop.sh",
-      "line": 1250
+      "line": 1263
     },
     {
       "file": "scripts/sw-loop.sh",
-      "line": 1253
+      "line": 1266
     },
     {
       "file": "scripts/sw-linear.sh",
-      "line": 1509
+      "line": 1522
     },
     {
       "file": "scripts/sw-linear.sh",
@@ -614,18 +622,38 @@
       "line": 161
     },
     {
-      "file": "scripts/sw-model-router.sh",
+      "file": "scripts/sw-constitutional-test.sh",
       "line": 160
+    },
+    {
+      "file": "scripts/sw-constitutional-test.sh",
+      "line": 67
+    },
+    {
+      "file": "scripts/sw-constitutional-test.sh",
+      "line": 71
+    },
+    {
+      "file": "scripts/sw-constitutional-test.sh",
+      "line": 154
+    },
+    {
+      "file": "scripts/sw-constitutional-test.sh",
+      "line": 162
+    },
+    {
+      "file": "scripts/sw-model-router.sh",
+      "line": 206
     }
   ],
   "script_size_hotspots": [
     {
       "script": "sw-loop.sh",
-      "lines": 2530
+      "lines": 2561
     },
     {
       "script": "sw-memory.sh",
-      "lines": 2118
+      "lines": 2240
     },
     {
       "script": "sw-daemon-test.sh",
diff --git a/.claude/recovery-state.json b/.claude/recovery-state.json
new file mode 100644
index 000000000..56986a1c6
--- /dev/null
+++ b/.claude/recovery-state.json
@@ -0,0 +1 @@
+{"attempts":0,"history":[],"current_model":"","escalation_level":0}
diff --git a/.claude/test-holdout/manifest.json b/.claude/test-holdout/manifest.json
new file mode 100644
index 000000000..f6a8a5bfb
--- /dev/null
+++ b/.claude/test-holdout/manifest.json
@@ -0,0 +1,8 @@
+{
+  "created": "2026-04-04T12:31:17Z",
+  "ratio": 30,
+  "total_tests": 22,
+  "visible_count": 20,
+  "sealed_count": 2,
+  "tests": [{"original":"tests/edge.test.js","sealed":".claude/test-holdout/.sealed/tests/edge.test.js","hash":"3815f72e3ca0f2f4733a4a5a96c49a4d"},{"original":"tests/util.test.js","sealed":".claude/test-holdout/.sealed/tests/util.test.js","hash":"fe8b5b0649713da37789013a82ee7007"}]
+}
diff --git a/.gitignore b/.gitignore
index c7f4f2ede..e54c8e652 100644
--- a/.gitignore
+++ b/.gitignore
@@ -35,3 +35,6 @@ node_modules/
 website/node_modules/
 website/dist/
 website/.astro/
+
+# Shipwright test holdout (sealed tests hidden from agents)
+.claude/test-holdout/.sealed/
diff --git a/scripts/sw-cost-test.sh b/scripts/sw-cost-test.sh
index 949af0c83..69d74a477 100755
--- a/scripts/sw-cost-test.sh
+++ b/scripts/sw-cost-test.sh
@@ -197,14 +197,17 @@ fi
 
 # Functional test: write mock events and verify dashboard parses them
 mkdir -p "$TEST_TEMP_DIR/home/.shipwright"
-cat > "$TEST_TEMP_DIR/home/.shipwright/events.jsonl" <<'EVTEOF'
-{"ts":"2026-02-27T10:00:00Z","type":"loop.context_efficiency","iteration":"1","raw_prompt_chars":"200000","trimmed_prompt_chars":"180000","trim_ratio":"10.0","budget_utilization":"100.0","budget_chars":"180000","job_id":"test-1"}
-{"ts":"2026-02-27T10:01:00Z","type":"loop.context_efficiency","iteration":"2","raw_prompt_chars":"150000","trimmed_prompt_chars":"150000","trim_ratio":"0.0","budget_utilization":"83.3","budget_chars":"180000","job_id":"test-1"}
+# Use current timestamp so entries are within the 30-day window
+_now_ts=$(date -u +"%Y-%m-%dT%H:%M:%SZ")
+_now_epoch=$(date +%s)
+cat > "$TEST_TEMP_DIR/home/.shipwright/events.jsonl" <<EVTEOF
+{"ts":"${_now_ts}","type":"loop.context_efficiency","iteration":"1","raw_prompt_chars":"200000","trimmed_prompt_chars":"180000","trim_ratio":"10.0","budget_utilization":"100.0","budget_chars":"180000","job_id":"test-1"}
+{"ts":"${_now_ts}","type":"loop.context_efficiency","iteration":"2","raw_prompt_chars":"150000","trimmed_prompt_chars":"150000","trim_ratio":"0.0","budget_utilization":"83.3","budget_chars":"180000","job_id":"test-1"}
 EVTEOF
 
-# Also need cost data for the dashboard to run
-cat > "$TEST_TEMP_DIR/home/.shipwright/costs.json" <<'COSTEOF'
-{"entries":[{"ts":"2026-02-27T10:00:00Z","ts_epoch":1772125200,"input_tokens":50000,"output_tokens":10000,"cost_usd":1.50,"model":"opus","stage":"build","issue":"1"}],"summary":{}}
+# Also need cost data for the dashboard to run (use current epoch so it's within 30-day window)
+cat > "$TEST_TEMP_DIR/home/.shipwright/costs.json" <<COSTEOF
+{"entries":[{"ts":"${_now_ts}","ts_epoch":${_now_epoch},"input_tokens":50000,"output_tokens":10000,"cost_usd":1.50,"model":"opus","stage":"build","issue":"1"}],"summary":{}}
 COSTEOF
 cat > "$TEST_TEMP_DIR/home/.shipwright/budget.json" <<'BUDEOF'
 {"daily_budget_usd":0,"enabled":false}
diff --git a/scripts/sw-formal-spec-test.sh b/scripts/sw-formal-spec-test.sh
old mode 100644
new mode 100755
diff --git a/scripts/sw-hello-test.sh b/scripts/sw-hello-test.sh
index 666299431..78a9fa8f7 100755
--- a/scripts/sw-hello-test.sh
+++ b/scripts/sw-hello-test.sh
@@ -35,11 +35,18 @@ assert_exit_code() {
     fi
 }
 
-# ─── Test: hello command outputs "hello world" ──────────────────────────────
+# ─── Test: hello command outputs "Shipwright vX.Y.Z" ───────────────────────
 test_hello_output() {
     local output
     output=$("$SCRIPT_DIR/sw-hello.sh")
-    assert_equals "hello world" "$output" "hello command outputs 'hello world'"
+    if [[ "$output" =~ ^Shipwright\ v[0-9]+\.[0-9]+\.[0-9]+ ]]; then
+        ((PASS++))
+        echo -e "  \033[38;2;74;222;128m\033[1m✓\033[0m hello command outputs 'Shipwright vX.Y.Z'"
+    else
+        ((FAIL++))
+        echo -e "  \033[38;2;248;113;113m\033[1m✗\033[0m hello command outputs 'Shipwright vX.Y.Z'"
+        echo "    Actual: $output"
+    fi
 }
 
 # ─── Test: hello command exits with 0 ───────────────────────────────────────
@@ -74,16 +81,36 @@ test_hello_short_help() {
     fi
 }
 
-# ─── Test: hello --version shows version ────────────────────────────────────
+# ─── Test: hello --version shows "Shipwright vX.Y.Z" ───────────────────────
 test_hello_version() {
     local output
     output=$("$SCRIPT_DIR/sw-hello.sh" --version)
-    if [[ "$output" =~ ^[0-9]+\.[0-9]+\.[0-9]+ ]]; then
+    if [[ "$output" =~ ^Shipwright\ v[0-9]+\.[0-9]+\.[0-9]+ ]]; then
+        ((PASS++))
+        echo -e "  \033[38;2;74;222;128m\033[1m✓\033[0m hello --version displays 'Shipwright vX.Y.Z'"
+    else
+        ((FAIL++))
+        echo -e "  \033[38;2;248;113;113m\033[1m✗\033[0m hello --version displays 'Shipwright vX.Y.Z'"
+        echo "    Actual: $output"
+    fi
+}
+
+# ─── Test: version is read from package.json ────────────────────────────────
+test_hello_version_from_package_json() {
+    local script_dir output pkg_version  # pkg_version: expected version, read independently of sw-hello.sh
+    script_dir="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
+    pkg_version=$(jq -r '.version // empty' "$script_dir/../package.json" 2>/dev/null \
+        || grep '"version"' "$script_dir/../package.json" 2>/dev/null \
+            | grep -o '[0-9][0-9]*\.[0-9][0-9]*\.[0-9][0-9]*' | head -1)
+    output=$("$SCRIPT_DIR/sw-hello.sh")
+    if [[ -n "$pkg_version" && "$output" == "Shipwright v${pkg_version}" ]]; then  # empty lookup must fail, not match "Shipwright v"
         ((PASS++))
-        echo -e "  \033[38;2;74;222;128m\033[1m✓\033[0m hello --version displays version"
+        echo -e "  \033[38;2;74;222;128m\033[1m✓\033[0m hello version matches package.json ($pkg_version)"
     else
         ((FAIL++))
-        echo -e "  \033[38;2;248;113;113m\033[1m✗\033[0m hello --version displays version"
+        echo -e "  \033[38;2;248;113;113m\033[1m✗\033[0m hello version matches package.json"
+        echo "    Expected: Shipwright v${pkg_version}"
+        echo "    Actual:   $output"
     fi
 }
 
@@ -100,6 +127,7 @@ test_hello_exit_code
 test_hello_help
 test_hello_short_help
 test_hello_version
+test_hello_version_from_package_json
 test_hello_invalid_option
 
 echo ""
diff --git a/scripts/sw-hello.sh b/scripts/sw-hello.sh
index 4c6180e90..4a0ccbc14 100755
--- a/scripts/sw-hello.sh
+++ b/scripts/sw-hello.sh
@@ -11,6 +11,13 @@ trap 'echo "ERROR: $BASH_SOURCE:$LINENO exited with status $?" >&2' ERR
 
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 
+# Read version from package.json; keep the script's VERSION if the file or its .version key is missing ('// empty' stops jq printing "null")
+_pkg_version=$(jq -r '.version // empty' "$SCRIPT_DIR/../package.json" 2>/dev/null \
+    || grep '"version"' "$SCRIPT_DIR/../package.json" 2>/dev/null \
+        | grep -o '[0-9][0-9]*\.[0-9][0-9]*\.[0-9][0-9]*' | head -1 \
+    || true)
+[[ -n "${_pkg_version:-}" ]] && VERSION="$_pkg_version"
+
 # Canonical helpers (colors, output, events)
 # shellcheck source=lib/helpers.sh
 [[ -f "$SCRIPT_DIR/lib/helpers.sh" ]] && source "$SCRIPT_DIR/lib/helpers.sh"
@@ -48,12 +55,12 @@ main() {
             exit 0
             ;;
         --version|-v)
-            echo "$VERSION"
+            echo "Shipwright v${VERSION}"
             exit 0
             ;;
         "")
-            # No arguments: output hello world
-            echo "hello world"
+            # No arguments: display Shipwright version
+            echo "Shipwright v${VERSION}"
             exit 0
             ;;
         *)
diff --git a/scripts/sw-mutation-executor-test.sh b/scripts/sw-mutation-executor-test.sh
old mode 100644
new mode 100755
diff --git a/scripts/sw-process-reward-test.sh b/scripts/sw-process-reward-test.sh
old mode 100644
new mode 100755
diff --git a/scripts/sw-reward-aggregator-test.sh b/scripts/sw-reward-aggregator-test.sh
old mode 100644
new mode 100755