diff --git a/.cc-pipeline/plan.md b/.cc-pipeline/plan.md
new file mode 100644
index 0000000..47f5228
--- /dev/null
+++ b/.cc-pipeline/plan.md
@@ -0,0 +1,961 @@
+# Implementation Plan
+
+> **For Claude:** REQUIRED SUB-SKILL: Use superpowers:executing-plans to implement this plan task-by-task.
+
+**Goal:** Implement v0.1.6 Phase 1 Critical Path: fix prompt accumulation on retry, add staged rebase after merge, and support array dependency DAGs.
+
+**Architecture:** Three independent features layered bottom-up through types → store → worktree-pool → agent-runner → scheduler. Types change first (Wave 0), then store + worktree-pool in parallel (Wave 1), then agent-runner (Wave 2), then scheduler integrates everything (Wave 3), then tests (Wave 4).
+
+**Tech Stack:** TypeScript 5, Node.js ESM, better-sqlite3, node:test + assert/strict
+
+---
+
+## Summary
+
+**Feature 1 — Prompt accumulation fix + model escalation:** Each retry currently appends error context to `task.prompt`, so by retry 3 the prompt contains 3 stacked error sections. Fix by saving the original prompt in `task._originalPrompt` on first retry, then rebuilding from `_originalPrompt + latest error` on each subsequent retry. Add model escalation: when `retryCount >= 2` set `task.modelOverride = "claude-opus-4-6"` so hard tasks get a more powerful model. `_originalPrompt` is persisted in SQLite (new `original_prompt` column migration). `modelOverride` is transient (set in memory at retry time, recomputed each retry).
+
+**Feature 2 — Staged rebase:** After a successful merge, other busy workers operate on a stale `main`. Add `WorktreePool.getActiveWorkers(exclude?)` (returns busy worker names, optionally excluding one) and `WorktreePool.rebaseOnMain(workerName)` (rebases branch onto current `main` tip, returns false on conflict). After every successful merge in `scheduler.executeAndRelease`, fire `rebaseOnMain` on all other active workers as best-effort (errors caught and logged, never blocking dispatch).
+
+**Feature 3 — Dependency DAG:** `dependsOn` currently accepts only a single string task ID. Extend to `string | string[]` (backward-compatible). The dispatch loop checks ALL dependencies; if any is failed/timeout/cancelled the task fails immediately; if any is still pending/running the task is re-queued. Store serializes array values as JSON (detected on read by `startsWith('[')`).
+
+---
+
+## Files to Create
+_(none — all changes are modifications to existing files)_
+
+## Files to Modify
+- `src/types.ts` — add `_originalPrompt?`, `modelOverride?` to Task; change `dependsOn` to `string | string[]`; update `createTask` opts
+- `src/store.ts` — add `original_prompt` column migration; update taskToParams/rowToTask for `_originalPrompt`; serialize array `dependsOn` as JSON; update `fieldMap` in `update()`
+- `src/worktree-pool.ts` — add `getActiveWorkers(exclude?)` and `rebaseOnMain(workerName)` public methods
+- `src/agent-runner.ts` — use `task.modelOverride ?? task.model ?? this.model` in `runClaudeSDK` and `runClaude`
+- `src/scheduler.ts` — fix prompt accumulation in `executeAndRelease` + `requeue`; add model escalation; update dependency check loop for arrays; call `pool.rebaseOnMain` on other workers after successful merge; update `submit()` opts type
+- `src/__tests__/scheduler.test.ts` — update `makePool()` mock; add tests for prompt accumulation fix, model escalation, array dependsOn
+- `src/__tests__/worktree-pool.test.ts` — add tests for `getActiveWorkers` and `rebaseOnMain`
+
+---
+
+## Waves (execution order)
+
+### Wave 0: Types (single task, blocks everything else)
+
+#### Task 1: Update `src/types.ts`
+
+**Files:**
+- Modify: `src/types.ts`
+
+**Step 1: Add two new optional fields to the Task interface**
+
+After line 39 (`model?: string;`), insert:
+```typescript
+  modelOverride?: string;
+  _originalPrompt?: string;
+```
+
+**Step 2: Change `dependsOn` type**
+
+Line 34: change `dependsOn?: string;` to:
+```typescript
+  dependsOn?: string | string[];
+```
+
+No changes needed to `createTask` body — `opts?.dependsOn` assignment already works for `string | string[]`.
+
+**Step 3: Run tsc to verify**
+```bash
+npx tsc --noEmit
+```
+Expected: no errors (this is a pure type widening, no breaking changes)
+
+**Step 4: Commit**
+```bash
+git add -A && git commit -m "feat(types): add modelOverride, _originalPrompt; widen dependsOn to string|string[]"
+```
+
+---
+
+### Wave 1: Store + WorktreePool (parallel — independent files, both depend on Wave 0)
+
+#### Task 2: Update `src/store.ts`
+
+**Files:**
+- Modify: `src/store.ts`
+
+This task has four parts. Apply them in sequence within this task.
+
+**Part A — Add migration for `original_prompt` column**
+
+In `migrate()`, after the existing `review` column migration block (around line 89, after `"ALTER TABLE tasks ADD COLUMN review TEXT"`), add:
+```typescript
+    // Add original_prompt column to preserve original prompt across retries
+    try {
+      this.db.exec("ALTER TABLE tasks ADD COLUMN original_prompt TEXT");
+    } catch {
+      // Column already exists — safe to ignore
+    }
+```
+
+**Part B — Update `taskToParams()`**
+
+The existing method returns 25 params. Replace it entirely:
+```typescript
+  private taskToParams(task: Task): unknown[] {
+    return [
+      task.id, task.prompt, task.status, task.worktree ?? null,
+      task.output, task.error, JSON.stringify(task.events),
+      task.createdAt, task.startedAt ?? null, task.completedAt ?? null,
+      task.timeout, task.maxBudget, task.costUsd,
+      task.tokenInput, task.tokenOutput, task.durationMs, task.retryCount, task.maxRetries,
+      task.priority ?? "normal",
+      JSON.stringify(task.tags ?? []),
+      task.dependsOn == null
+        ? null
+        : Array.isArray(task.dependsOn)
+          ? JSON.stringify(task.dependsOn)
+          : task.dependsOn,
+      task.webhookUrl ?? null, task.summary ?? null,
+      task.agent ?? "claude",
+      JSON.stringify(task.review ?? null),
+      task._originalPrompt ?? null,
+    ];
+  }
+```
+(26 params now — `original_prompt` is the last one)
+
+**Part C — Update all SQL statements to include `original_prompt`**
+
+There are 4 SQL statements across `save()`, `updateBatch()`, and `saveBatch()` — two variants each (INSERT and UPDATE). Update all of them:
+
+INSERT (add `original_prompt` to column list and add `?` to VALUES — goes from 25 `?` to 26):
+```sql
+INSERT OR IGNORE INTO tasks
+(id, prompt, status, worktree, output, error, events, created_at,
+ started_at, completed_at, timeout, max_budget, cost_usd,
+ token_input, token_output, duration_ms, retry_count, max_retries, priority, tags,
+ depends_on, webhook_url, summary, agent, review, original_prompt)
+VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+```
+
+UPDATE (add `original_prompt=?` before `WHERE id=?`):
+```sql
+UPDATE tasks SET
+  prompt=?, status=?, worktree=?, output=?, error=?, events=?, created_at=?,
+  started_at=?, completed_at=?, timeout=?, max_budget=?, cost_usd=?,
+  token_input=?, token_output=?, duration_ms=?, retry_count=?, max_retries=?,
+  priority=?, tags=?, depends_on=?, webhook_url=?, summary=?, agent=?, review=?,
+  original_prompt=?
+WHERE id=?
+```
+
+Apply these SQL changes to `save()`, `updateBatch()` (insertStmt + updateStmt), and `saveBatch()` (insertStmt + updateStmt) — 6 SQL strings total.
+
+**Part D — Update `update()` fieldMap and `rowToTask()`**
+
+In `update()` fieldMap, replace the existing `dependsOn` entry and add `_originalPrompt`:
+```typescript
+      dependsOn:   { col: "depends_on", serialize: (v) => {
+        if (v == null) return null;
+        return Array.isArray(v) ? JSON.stringify(v as unknown[]) : v as string;
+      }},
+      _originalPrompt: { col: "original_prompt" },
+```
+
+In `rowToTask()`, replace the `dependsOn` line and add `_originalPrompt`:
+```typescript
+      dependsOn: (() => {
+        const raw = row.depends_on as string | null | undefined;
+        if (!raw) return undefined;
+        if (raw.startsWith("[")) {
+          try { return JSON.parse(raw) as string[]; } catch { return raw; }
+        }
+        return raw;
+      })(),
+      _originalPrompt: (row.original_prompt as string | null) ?? undefined,
+```
+
+**Step 5: Run tsc**
+```bash
+npx tsc --noEmit
+```
+Expected: no errors. Fix any type errors before committing.
+
+**Step 6: Commit**
+```bash
+git add -A && git commit -m "feat(store): persist _originalPrompt; serialize dependsOn array as JSON"
+```
+
+---
+
+#### Task 3: Add rebase methods to `src/worktree-pool.ts`
+
+**Files:**
+- Modify: `src/worktree-pool.ts`
+
+**Step 1: Add two public methods**
+
+Insert after the `getWorkerStats()` method (around line 386) and before the private `git()` helper:
+
+```typescript
+  /**
+   * Returns names of all currently-busy workers, optionally excluding one.
+   * Used by the scheduler to find other workers to rebase after a merge.
+   */
+  getActiveWorkers(exclude?: string): string[] {
+    const result: string[] = [];
+    for (const w of this.workers.values()) {
+      if (w.busy && w.name !== exclude) result.push(w.name);
+    }
+    return result;
+  }
+
+  /**
+   * Rebases the worker's branch onto the current tip of main.
+   * Returns true on success, false if there were conflicts (rebase is aborted).
+   * Best-effort — callers must not block on failure.
+   */
+  async rebaseOnMain(workerName: string): Promise<boolean> {
+    const w = this.workers.get(workerName);
+    if (!w) return false;
+    try {
+      const { stdout } = await this.git("rev-parse", "main");
+      const mainSha = stdout.trim();
+      await this.gitIn(w.path, "rebase", mainSha);
+      return true;
+    } catch {
+      await this.gitIn(w.path, "rebase", "--abort").catch(() => {});
+      log("warn", "[pool] rebaseOnMain: conflict, aborted", { worker: workerName });
+      return false;
+    }
+  }
+```
+
+**Step 2: Run tsc**
+```bash
+npx tsc --noEmit
+```
+Expected: no errors
+
+**Step 3: Commit**
+```bash
+git add -A && git commit -m "feat(worktree-pool): add getActiveWorkers() and rebaseOnMain()"
+```
+
+---
+
+### Wave 2: AgentRunner model override (depends on Wave 0)
+
+#### Task 4: Update `src/agent-runner.ts`
+
+**Files:**
+- Modify: `src/agent-runner.ts`
+
+**Step 1: Update `runClaudeSDK()` model selection**
+
+Find (~line 400):
+```typescript
+          model: task.model ?? this.model,
+```
+Change to:
+```typescript
+          model: task.modelOverride ?? task.model ?? this.model,
+```
+
+**Step 2: Update `runClaude()` model selection**
+
+Find (~line 438):
+```typescript
+        "--model", task.model ?? this.model,
+```
+Change to:
+```typescript
+        "--model", task.modelOverride ?? task.model ?? this.model,
+```
+
+**Step 3: Run tsc**
+```bash
+npx tsc --noEmit
+```
+Expected: no errors
+
+**Step 4: Commit**
+```bash
+git add -A && git commit -m "feat(agent-runner): honour task.modelOverride in runClaude and runClaudeSDK"
+```
+
+---
+
+### Wave 3: Scheduler — integrate all three features (depends on Waves 1 + 2)
+
+#### Task 5: Update `src/scheduler.ts`
+
+**Files:**
+- Modify: `src/scheduler.ts`
+
+Apply four sub-changes in sequence. Run `npx tsc --noEmit` after all four before committing.
+
+---
+
+**Sub-change A: Fix prompt accumulation in `executeAndRelease()`**
+
+Find the retry block starting at ~line 544:
+```typescript
+      if (task.status === "failed" && task.retryCount < task.maxRetries) {
+        shouldRetry = true;
+        const prevError = task.error ?? "";
+        task.retryCount++;
+        task.status = "pending";
+        task.completedAt = undefined;
+        // Inject previous error into prompt so the agent can learn from it
+        if (prevError) {
+          const errorContext = prevError.length > 500 ? prevError.slice(0, 500) + "..." : prevError;
+          task.prompt = `${task.prompt}\n\n---\n## Previous Attempt Failed (attempt ${task.retryCount})\nError: ${errorContext}\nFix the error above and try again.`;
+        }
+        task.error = "";
+        // Swap agent on retry for better chance of success
+        const prevAgent = task.agent ?? "claude";
+        task.agent = AgentRunner.pickFallbackAgent(prevAgent);
+        log("info", "task retrying with error context", { taskId: task.id, attempt: task.retryCount, maxRetries: task.maxRetries, agent: prevAgent, fallback: task.agent });
+      }
+```
+
+Replace with:
+```typescript
+      if (task.status === "failed" && task.retryCount < task.maxRetries) {
+        shouldRetry = true;
+        const prevError = task.error ?? "";
+        task.retryCount++;
+        task.status = "pending";
+        task.completedAt = undefined;
+        // Save original prompt on first retry; rebuild from it on subsequent retries
+        if (!task._originalPrompt) {
+          task._originalPrompt = task.prompt;
+        }
+        if (prevError) {
+          const errorContext = prevError.length > 500 ? prevError.slice(0, 500) + "..." : prevError;
+          task.prompt = `${task._originalPrompt}\n\n---\n## Previous Attempt Failed (attempt ${task.retryCount})\nError: ${errorContext}\nFix the error above and try again.`;
+        } else {
+          task.prompt = task._originalPrompt;
+        }
+        // Escalate to opus on second retry (retryCount has already been incremented above)
+        if (task.retryCount >= 2) {
+          task.modelOverride = "claude-opus-4-6";
+        }
+        task.error = "";
+        // Swap agent on retry for better chance of success
+        const prevAgent = task.agent ?? "claude";
+        task.agent = AgentRunner.pickFallbackAgent(prevAgent);
+        log("info", "task retrying with error context", { taskId: task.id, attempt: task.retryCount, maxRetries: task.maxRetries, agent: prevAgent, fallback: task.agent });
+      }
+```
+
+---
+
+**Sub-change B: Fix prompt accumulation in `requeue()`**
+
+Find in `requeue()` (~lines 149–164):
+```typescript
+    // Inject previous error into prompt so agent can learn from it
+    const prevError = task.error ?? "";
+    if (prevError) {
+      const errorContext = prevError.length > 500 ? prevError.slice(0, 500) + "..." : prevError;
+      task.prompt = `${task.prompt}\n\n---\n## Previous Attempt Failed (attempt ${task.retryCount + 1})\nError: ${errorContext}\nFix the error above and try again.`;
+    }
+
+    task.status = "pending";
+    task.error = "";
+    task.retryCount += 1;
+    task.completedAt = undefined;
+```
+
+Replace with:
+```typescript
+    // Save original prompt on first retry; rebuild from it on subsequent retries
+    const prevError = task.error ?? "";
+    if (!task._originalPrompt) {
+      task._originalPrompt = task.prompt;
+    }
+    if (prevError) {
+      const errorContext = prevError.length > 500 ? prevError.slice(0, 500) + "..." : prevError;
+      task.prompt = `${task._originalPrompt}\n\n---\n## Previous Attempt Failed (attempt ${task.retryCount + 1})\nError: ${errorContext}\nFix the error above and try again.`;
+    } else {
+      task.prompt = task._originalPrompt;
+    }
+
+    task.status = "pending";
+    task.error = "";
+    task.retryCount += 1;
+    task.completedAt = undefined;
+    // Escalate to opus on second+ manual retry
+    if (task.retryCount >= 2) {
+      task.modelOverride = "claude-opus-4-6";
+    }
+```
+
+---
+
+**Sub-change C: Update dependency DAG check in `loop()`**
+
+Find the dependency check block (~lines 443–461):
+```typescript
+      if (task.dependsOn) {
+        const dep = this.tasks.get(task.dependsOn) ?? this.store.get(task.dependsOn) ?? undefined;
+        if (dep?.status !== "success") {
+          // If dependency is in a terminal failure state (or missing), fail this task
+          if (!dep || dep.status === "failed" || dep.status === "timeout" || dep.status === "cancelled") {
+            task.status = "failed";
+            task.error = `dependency ${task.dependsOn} is ${dep?.status ?? "missing"}`;
+            task.completedAt = new Date().toISOString();
+            this.store.save(task);
+            this.onEvent?.({ type: "task_final", taskId: task.id, status: task.status });
+            continue;
+          }
+          // Still pending/running — re-queue and wait
+          log("info", "task waiting on dependency", { taskId: task.id, dependsOn: task.dependsOn });
+          this.queue.push(task);
+          await this.waitForDispatch(1_000);
+          continue;
+        }
+      }
+```
+
+Replace with:
+```typescript
+      if (task.dependsOn) {
+        const depIds = Array.isArray(task.dependsOn) ? task.dependsOn : [task.dependsOn];
+        let anyFailed = false;
+        let failedDepId: string | undefined;
+        let failedDepStatus: string | undefined;
+        let allSuccess = true;
+
+        for (const depId of depIds) {
+          const dep = this.tasks.get(depId) ?? this.store.get(depId) ?? undefined;
+          if (!dep || dep.status === "failed" || dep.status === "timeout" || dep.status === "cancelled") {
+            anyFailed = true;
+            failedDepId = depId;
+            failedDepStatus = dep?.status ?? "missing";
+            break;
+          }
+          if (dep.status !== "success") {
+            allSuccess = false;
+          }
+        }
+
+        if (anyFailed) {
+          task.status = "failed";
+          task.error = `dependency ${failedDepId} is ${failedDepStatus}`;
+          task.completedAt = new Date().toISOString();
+          this.store.save(task);
+          this.onEvent?.({ type: "task_final", taskId: task.id, status: task.status });
+          continue;
+        }
+        if (!allSuccess) {
+          log("info", "task waiting on dependency", { taskId: task.id, dependsOn: task.dependsOn });
+          this.queue.push(task);
+          await this.waitForDispatch(1_000);
+          continue;
+        }
+      }
+```
+
+---
+
+**Sub-change D: Staged rebase after merge + update `submit()` opts type**
+
+Find in `executeAndRelease()` the merge result line (~line 514):
+```typescript
+      const mergeResult = await this.pool.release(workerName, shouldMerge, task.id);
+
+      if (shouldMerge && !mergeResult.merged) {
+```
+
+After `pool.release(...)`, insert the rebase block:
+```typescript
+      const mergeResult = await this.pool.release(workerName, shouldMerge, task.id);
+
+      // After a successful merge, rebase other active workers onto new main (best-effort)
+      if (shouldMerge && mergeResult.merged) {
+        for (const otherWorker of this.pool.getActiveWorkers(workerName)) {
+          this.pool.rebaseOnMain(otherWorker).catch((err: unknown) => {
+            log("warn", "staged rebase failed (best-effort)", { worker: otherWorker, error: String(err) });
+          });
+        }
+      }
+
+      if (shouldMerge && !mergeResult.merged) {
+```
+
+Also update the `submit()` method signature to accept `dependsOn?: string | string[]`:
+
+Find (~line 72):
+```typescript
+  submit(prompt: string, opts?: { id?: string; timeout?: number; maxBudget?: number; priority?: import("./types.js").TaskPriority; dependsOn?: string; webhookUrl?: string; tags?: string[]; agent?: string; allowLongPrompt?: boolean }): Task {
+```
+
+Change `dependsOn?: string` to `dependsOn?: string | string[]`.
+
+---
+
+**Step 5: Run tsc**
+```bash
+npx tsc --noEmit
+```
+Expected: no errors. Fix any type errors before proceeding.
+
+**Step 6: Run existing tests to verify nothing broke**
+```bash
+node --import tsx --test src/__tests__/scheduler.test.ts
+```
+Expected: all existing tests pass (some may fail due to missing `getActiveWorkers`/`rebaseOnMain` in the mock — see Task 6 fix below, but do not commit tests yet)
+
+**Step 7: Commit**
+```bash
+git add -A && git commit -m "feat(scheduler): fix prompt accumulation, model escalation, array dependsOn, staged rebase"
+```
+
+---
+
+### Wave 4: Tests (parallel — different test files)
+
+#### Task 6: Tests for WorktreePool new methods
+
+**Files:**
+- Modify: `src/__tests__/worktree-pool.test.ts`
+
+Append two new `describe` blocks at the end of the file (after the existing "WorktreePool stats" block):
+
+```typescript
+// ---------------------------------------------------------------------------
+// getActiveWorkers
+// ---------------------------------------------------------------------------
+
+describe("WorktreePool.getActiveWorkers", () => {
+  it("returns empty array when no workers are busy", async () => {
+    const { repoPath, cleanup } = await makeTempRepo();
+    try {
+      const pool = new WorktreePool(repoPath, 2);
+      await pool.init();
+
+      assert.deepStrictEqual(pool.getActiveWorkers(), [], "no workers should be active initially");
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("returns all busy worker names", async () => {
+    const { repoPath, cleanup } = await makeTempRepo();
+    try {
+      const pool = new WorktreePool(repoPath, 3);
+      await pool.init();
+
+      const w1 = await pool.acquire();
+      const w2 = await pool.acquire();
+      assert.ok(w1 !== null && w2 !== null);
+
+      const active = pool.getActiveWorkers();
+      assert.strictEqual(active.length, 2, "should report 2 active workers");
+      assert.ok(active.includes(w1.name), "should include first acquired worker");
+      assert.ok(active.includes(w2.name), "should include second acquired worker");
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("excludes the named worker from results", async () => {
+    const { repoPath, cleanup } = await makeTempRepo();
+    try {
+      const pool = new WorktreePool(repoPath, 3);
+      await pool.init();
+
+      const w1 = await pool.acquire();
+      const w2 = await pool.acquire();
+      assert.ok(w1 !== null && w2 !== null);
+
+      const active = pool.getActiveWorkers(w1.name);
+      assert.strictEqual(active.length, 1, "should return 1 after excluding one");
+      assert.strictEqual(active[0], w2.name, "remaining entry should be the non-excluded worker");
+    } finally {
+      cleanup();
+    }
+  });
+});
+
+// ---------------------------------------------------------------------------
+// rebaseOnMain
+// ---------------------------------------------------------------------------
+
+describe("WorktreePool.rebaseOnMain", () => {
+  it("returns false for unknown worker name", async () => {
+    const { repoPath, cleanup } = await makeTempRepo();
+    try {
+      const pool = new WorktreePool(repoPath, 1);
+      await pool.init();
+
+      const result = await pool.rebaseOnMain("nonexistent");
+      assert.strictEqual(result, false, "unknown worker should return false");
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("returns true when branch is already up to date with main", async () => {
+    const { repoPath, cleanup } = await makeTempRepo();
+    try {
+      const pool = new WorktreePool(repoPath, 1);
+      await pool.init();
+
+      // Worker was just reset to current main tip — nothing to rebase
+      const worker = await pool.acquire();
+      assert.ok(worker !== null);
+
+      const result = await pool.rebaseOnMain(worker.name);
+      assert.strictEqual(result, true, "up-to-date branch should rebase successfully");
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("returns true after rebasing worker branch onto new main commits", async () => {
+    const { repoPath, cleanup } = await makeTempRepo();
+    try {
+      const pool = new WorktreePool(repoPath, 2);
+      await pool.init();
+
+      // Acquire worker-0 and add a commit on its branch (non-conflicting file)
+      const w0 = await pool.acquire();
+      assert.ok(w0 !== null);
+      fs.writeFileSync(path.join(w0.path, "worker-file.txt"), "worker work\n");
+      const git0 = (...args: string[]) => execFileAsync("git", args, { cwd: w0.path });
+      await git0("add", "worker-file.txt");
+      await git0("commit", "-m", "worker commit");
+
+      // Simulate a new commit landing on main via worker-1
+      const w1 = await pool.acquire();
+      assert.ok(w1 !== null);
+      fs.writeFileSync(path.join(w1.path, "main-new.txt"), "new on main\n");
+      const git1 = (...args: string[]) => execFileAsync("git", args, { cwd: w1.path });
+      await git1("add", "main-new.txt");
+      await git1("commit", "-m", "new main commit");
+      const { stdout: newSha } = await git1("rev-parse", "HEAD");
+      // Update main ref to simulate a squash merge landing
+      await execFileAsync("git", ["update-ref", "refs/heads/main", newSha.trim()], { cwd: repoPath });
+
+      // Rebase w0 onto new main
+      const result = await pool.rebaseOnMain(w0.name);
+      assert.strictEqual(result, true, "rebase onto non-conflicting main should succeed");
+    } finally {
+      cleanup();
+    }
+  });
+});
+```
+
+**Step 1: Append the two describe blocks**
+
+**Step 2: Run the test file**
+```bash
+node --import tsx --test src/__tests__/worktree-pool.test.ts
+```
+Expected: all tests pass including new ones
+
+**Step 3: Commit**
+```bash
+git add -A && git commit -m "test(worktree-pool): getActiveWorkers and rebaseOnMain coverage"
+```
+
+---
+
+#### Task 7: Tests for Scheduler new behaviour
+
+**Files:**
+- Modify: `src/__tests__/scheduler.test.ts`
+
+**Step 1: Update `makePool()` mock at the top of the file**
+
+The existing `makePool()` returns an object without `getActiveWorkers` or `rebaseOnMain`. The scheduler now calls both. Find `makePool()` and add the two stubs:
+
+```typescript
+function makePool(): WorktreePool {
+  return {
+    available: 2,
+    busy: 0,
+    acquire: async () => ({ name: "w0", path: "/tmp/w0", branch: "worker/w0", busy: true }),
+    release: async () => ({ merged: true }),
+    init: async () => {},
+    getStatus: () => [],
+    getActiveWorkers: (_exclude?: string) => [],
+    rebaseOnMain: async (_name: string) => true,
+  } as unknown as WorktreePool;
+}
+```
+
+**Step 2: Append new describe blocks at the end of the file**
+
+```typescript
+// ---------------------------------------------------------------------------
+// Prompt accumulation fix
+// ---------------------------------------------------------------------------
+
+describe("Scheduler retry — prompt accumulation fix", () => {
+  it("second retry rebuilds prompt from _originalPrompt, not accumulated prompt", async () => {
+    let callCount = 0;
+    const capturedPrompts: string[] = [];
+
+    const runner = {
+      run: async (task: Task) => {
+        callCount++;
+        capturedPrompts.push(task.prompt);
+        if (callCount <= 2) {
+          task.status = "failed";
+          task.error = `error on attempt ${callCount}`;
+          task.durationMs = 10;
+        } else {
+          task.status = "success";
+          task.durationMs = 10;
+        }
+        return task;
+      },
+      getRunningTasks: () => [],
+      reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+    } as unknown as import("../agent-runner.js").AgentRunner;
+
+    const store = makeStore();
+    const s = new Scheduler(makePool(), runner, store);
+    s.start();
+
+    s.submit("original prompt text", { maxRetries: 3 });
+    // Allow enough time for 3 attempts
+    await new Promise((r) => setTimeout(r, 600));
+    await s.stop();
+
+    // Every attempt after the first should see exactly one "## Previous Attempt Failed" section
+    for (let i = 1; i < capturedPrompts.length; i++) {
+      const sections = (capturedPrompts[i].match(/## Previous Attempt Failed/g) ?? []).length;
+      assert.strictEqual(sections, 1,
+        `Attempt ${i + 1} prompt should have exactly 1 error section, got ${sections}.\nPrompt: ${capturedPrompts[i].slice(0, 300)}`);
+    }
+  });
+
+  it("stores _originalPrompt on first retry", async () => {
+    let callCount = 0;
+
+    const runner = {
+      run: async (task: Task) => {
+        callCount++;
+        if (callCount === 1) {
+          task.status = "failed";
+          task.error = "first failure";
+          task.durationMs = 10;
+        } else {
+          task.status = "success";
+          task.durationMs = 10;
+        }
+        return task;
+      },
+      getRunningTasks: () => [],
+      reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+    } as unknown as import("../agent-runner.js").AgentRunner;
+
+    const store = makeStore();
+    const s = new Scheduler(makePool(), runner, store);
+    s.start();
+
+    const task = s.submit("the real original prompt", { maxRetries: 1 });
+    await new Promise((r) => setTimeout(r, 400));
+    await s.stop();
+
+    assert.strictEqual(task._originalPrompt, "the real original prompt",
+      "_originalPrompt should be saved after first retry");
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Model escalation
+// ---------------------------------------------------------------------------
+
+describe("Scheduler retry — model escalation", () => {
+  it("sets modelOverride to claude-opus-4-6 on retryCount >= 2", async () => {
+    const modelOverrides: Array<string | undefined> = [];
+    let callCount = 0;
+
+    const runner = {
+      run: async (task: Task) => {
+        callCount++;
+        modelOverrides.push(task.modelOverride);
+        task.status = "failed";
+        task.error = "always fails";
+        task.durationMs = 10;
+        return task;
+      },
+      getRunningTasks: () => [],
+      reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+    } as unknown as import("../agent-runner.js").AgentRunner;
+
+    const s = new Scheduler(makePool(), runner, makeStore());
+    s.start();
+    s.submit("test model escalation", { maxRetries: 2 });
+    await new Promise((r) => setTimeout(r, 600));
+    await s.stop();
+
+    // 3 total attempts: attempt 0, 1, 2
+    // On attempt at retryCount=2 (third call), modelOverride should be "claude-opus-4-6"
+    assert.ok(callCount >= 3, `expected at least 3 attempts, got ${callCount}`);
+    assert.strictEqual(modelOverrides[2], "claude-opus-4-6",
+      `third attempt (retryCount=2) should use claude-opus-4-6, got: ${modelOverrides[2]}`);
+    // First two attempts should not have modelOverride set
+    assert.strictEqual(modelOverrides[0], undefined, "first attempt should not have modelOverride");
+    assert.strictEqual(modelOverrides[1], undefined, "second attempt (retryCount=1) should not have modelOverride");
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Array dependsOn (DAG)
+// ---------------------------------------------------------------------------
+
+describe("Scheduler dependency DAG — array dependsOn", () => {
+  it("task with string[] dependsOn waits for all deps before running", async () => {
+    const store = makeStore();
+    const completionOrder: string[] = [];
+
+    const runner = {
+      run: async (task: Task) => {
+        await new Promise((r) => setTimeout(r, 30));
+        task.status = "success";
+        task.durationMs = 30;
+        completionOrder.push(task.id);
+        return task;
+      },
+      getRunningTasks: () => [],
+      reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+    } as unknown as import("../agent-runner.js").AgentRunner;
+
+    // Pool with 3 workers so deps can run in parallel
+    const pool = {
+      available: 3,
+      busy: 0,
+      acquire: (() => {
+        let n = 0;
+        return async () => ({ name: `w${n++}`, path: `/tmp/w${n}`, branch: `worker/w${n}`, busy: true });
+      })(),
+      release: async () => ({ merged: true }),
+      init: async () => {},
+      getStatus: () => [],
+      getActiveWorkers: () => [],
+      rebaseOnMain: async () => true,
+    } as unknown as import("../worktree-pool.js").WorktreePool;
+
+    const s = new Scheduler(pool, runner, store);
+    s.start();
+
+    const dep1 = s.submit("dep task 1");
+    const dep2 = s.submit("dep task 2");
+    const dependent = s.submit("dependent task", { dependsOn: [dep1.id, dep2.id] });
+
+    await new Promise((r) => setTimeout(r, 600));
+    await s.stop();
+
+    const savedDependent = store.get(dependent.id);
+    assert.strictEqual(savedDependent?.status, "success",
+      `dependent task should succeed, got: ${savedDependent?.status}`);
+
+    const dep1Idx = completionOrder.indexOf(dep1.id);
+    const dep2Idx = completionOrder.indexOf(dep2.id);
+    const depIdx = completionOrder.indexOf(dependent.id);
+    assert.ok(dep1Idx !== -1, "dep1 should have completed");
+    assert.ok(dep2Idx !== -1, "dep2 should have completed");
+    assert.ok(depIdx !== -1, "dependent should have completed");
+    assert.ok(dep1Idx < depIdx, "dep1 must complete before dependent");
+    assert.ok(dep2Idx < depIdx, "dep2 must complete before dependent");
+  });
+
+  it("dependent task fails immediately when any dep in array fails", async () => {
+    const store = makeStore();
+
+    const runner = {
+      run: async (task: Task) => {
+        if (task.prompt === "will fail") {
+          task.status = "failed";
+          task.error = "intentional failure";
+        } else {
+          task.status = "success";
+        }
+        task.durationMs = 10;
+        return task;
+      },
+      getRunningTasks: () => [],
+      reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+    } as unknown as import("../agent-runner.js").AgentRunner;
+
+    const pool = {
+      available: 2,
+      busy: 0,
+      acquire: (() => {
+        let n = 0;
+        return async () => ({ name: `w${n++}`, path: `/tmp/w${n}`, branch: `worker/w${n}`, busy: true });
+      })(),
+      release: async () => ({ merged: true }),
+      init: async () => {},
+      getStatus: () => [],
+      getActiveWorkers: () => [],
+      rebaseOnMain: async () => true,
+    } as unknown as import("../worktree-pool.js").WorktreePool;
+
+    const s = new Scheduler(pool, runner, store);
+    s.start();
+
+    const depFailing = s.submit("will fail", { maxRetries: 0 });
+    const depOk = s.submit("will succeed");
+    const dependent = s.submit("dep on both", { dependsOn: [depFailing.id, depOk.id] });
+
+    await new Promise((r) => setTimeout(r, 500));
+    await s.stop();
+
+    const savedDependent = store.get(dependent.id);
+    assert.strictEqual(savedDependent?.status, "failed",
+      `dependent should be failed when a dep fails, got: ${savedDependent?.status}`);
+    assert.ok(savedDependent?.error.includes(depFailing.id),
+      `error message should reference the failed dep ID. Got: ${savedDependent?.error}`);
+  });
+
+  it("string dependsOn (single ID, backward-compat) still works", () => {
+    const store = makeStore();
+    const s = new Scheduler(makePool(), makeRunner(), store);
+
+    const dep = s.submit("parent task");
+    dep.status = "success";
+    store.save(dep);
+
+    // String (not array) — must not break
+    const child = s.submit("child task", { dependsOn: dep.id });
+    assert.strictEqual(child.status, "pending",
+      "child with string dependsOn should be pending (not immediately failed)");
+  });
+});
+```
+
+**Step 3: Run the full scheduler test file**
+```bash
+node --import tsx --test src/__tests__/scheduler.test.ts
+```
+Expected: all tests pass
+
+**Step 4: Run the entire test suite**
+```bash
+node --import tsx --test src/__tests__/*.test.ts
+```
+Expected: all tests pass
+
+**Step 5: Commit**
+```bash
+git add -A && git commit -m "test(scheduler): prompt accumulation fix, model escalation, array dependsOn coverage"
+```
+
+---
+
+## Risks
+
+| Risk | Mitigation |
+|------|-----------|
+| **SQL param count mismatch** — `taskToParams` now returns 26 params but SQL might still expect 25 | Count `?` placeholders in every INSERT/UPDATE statement after editing. 26 columns in INSERT, 25 SET clauses + 1 WHERE in UPDATE (26 total params, same array) |
+| **`retryCount` increment order** — in `executeAndRelease`, `retryCount++` happens BEFORE the `>= 2` check. In `requeue()`, `retryCount += 1` happens AFTER. Be careful: escalation fires at retryCount=2 in both places | Double-check: after `task.retryCount++` the value is 2 on the third attempt. In requeue, `retryCount += 1` then `if (task.retryCount >= 2)` — same logic |
+| **Rebase locking** — `rebaseOnMain` calls `gitIn` which runs in a worktree. If the worktree is actively running an agent that is also calling git, rebase could conflict | Rebase is best-effort, fires after the current worker's merge completes (that worker is already released). Other active workers are using different worktree paths |
+| **Test timing flakiness** — async scheduler tests use `setTimeout` delays. Slow CI might fail | If tests flake, increase delays. 600ms allows 3 × 10ms-duration runs with plenty of scheduling overhead |
+| **`dependsOn` JSON round-trip** — reading old DB rows where `depends_on` is a plain string like `"abc123"` must not be accidentally JSON-parsed | The `startsWith('[')` guard handles this — only arrays are parsed as JSON |
diff --git a/.cc-pipeline/tasks.json b/.cc-pipeline/tasks.json
new file mode 100644
index 0000000..76f006c
--- /dev/null
+++ b/.cc-pipeline/tasks.json
@@ -0,0 +1,37 @@
+{
+  "waves": [
+    {
+      "waveIndex": 0,
+      "tasks": [
+        "Modify src/types.ts only. (1) In the Task interface, after the line `model?: string;`, add two new optional fields: `modelOverride?: string;` and `_originalPrompt?: string;`. (2) Change the existing `dependsOn?: string;` field to `dependsOn?: string | string[];`. No other changes are needed — createTask() already handles the widened type via opts?.dependsOn assignment. Run `npx tsc --noEmit` and verify no errors. Then commit: `git add -A && git commit -m \"feat(types): add modelOverride, _originalPrompt; widen dependsOn to string|string[]\"`"
+      ]
+    },
+    {
+      "waveIndex": 1,
+      "tasks": [
+        "Modify src/store.ts only. Apply four changes in sequence: (1) In migrate(), after the existing `review` column ALTER TABLE try/catch block, add: `try { this.db.exec(\"ALTER TABLE tasks ADD COLUMN original_prompt TEXT\"); } catch {}`. (2) In taskToParams(), append `task._originalPrompt ?? null` as the 26th element of the returned array. (3) Update all INSERT SQL strings in save(), updateBatch() insertStmt, and saveBatch() insertStmt to add `original_prompt` to the column list and a 26th `?` to VALUES. Update all UPDATE SQL strings to add `original_prompt=?` before `WHERE id=?` (the params array is already 26 elements from step 2). (4) In update() fieldMap, replace the dependsOn entry with: `dependsOn: { col: 'depends_on', serialize: (v) => v == null ? null : Array.isArray(v) ? JSON.stringify(v as unknown[]) : v as string }`, and add `_originalPrompt: { col: 'original_prompt' }`. In rowToTask(), replace the dependsOn line with: `dependsOn: (() => { const raw = row.depends_on as string|null|undefined; if (!raw) return undefined; if (raw.startsWith('[')) { try { return JSON.parse(raw) as string[]; } catch { return raw; } } return raw; })()`, and add `_originalPrompt: (row.original_prompt as string | null) ?? undefined`. Run `npx tsc --noEmit`. Commit: `git add -A && git commit -m \"feat(store): persist _originalPrompt; serialize dependsOn array as JSON\"`",
+        "Modify src/worktree-pool.ts only. Insert two new public methods after the getWorkerStats() method, before the private git() helper: (1) `getActiveWorkers(exclude?: string): string[]` — iterate `this.workers.values()`, push `w.name` into result array when `w.busy && w.name !== exclude`, return result. (2) `async rebaseOnMain(workerName: string): Promise<boolean>` — get worker via `this.workers.get(workerName)`, return false if not found; call `const { stdout } = await this.git('rev-parse', 'main')` to get mainSha (trim it); call `await this.gitIn(w.path, 'rebase', mainSha)`; on any error, call `await this.gitIn(w.path, 'rebase', '--abort').catch(() => {})`, log a warn with `log('warn', '[pool] rebaseOnMain: conflict, aborted', { worker: workerName })`, and return false; return true on success. Use the existing `log` import and `this.git`/`this.gitIn` helpers already in the file. Run `npx tsc --noEmit`. Commit: `git add -A && git commit -m \"feat(worktree-pool): add getActiveWorkers() and rebaseOnMain()\"`"
+      ]
+    },
+    {
+      "waveIndex": 2,
+      "tasks": [
+        "Modify src/agent-runner.ts only. Make exactly two line changes: (1) In runClaudeSDK(), find the line `model: task.model ?? this.model,` and change it to `model: task.modelOverride ?? task.model ?? this.model,`. (2) In runClaude(), find the line `\"--model\", task.model ?? this.model,` and change it to `\"--model\", task.modelOverride ?? task.model ?? this.model,`. No other changes. Run `npx tsc --noEmit` and verify no errors. Commit: `git add -A && git commit -m \"feat(agent-runner): honour task.modelOverride in runClaude and runClaudeSDK\"`"
+      ]
+    },
+    {
+      "waveIndex": 3,
+      "tasks": [
+        "Modify src/scheduler.ts only. Apply four sub-changes then compile and commit. (1) In executeAndRelease(), in the retry block where task.prompt is modified: after `task.retryCount++`, add `if (!task._originalPrompt) { task._originalPrompt = task.prompt; }`, then replace the existing prompt-mutation line with `task.prompt = prevError ? \\`${task._originalPrompt}\\n\\n---\\n## Previous Attempt Failed (attempt ${task.retryCount})\\nError: ${errorContext}\\nFix the error above and try again.\\` : task._originalPrompt;`, then after that add `if (task.retryCount >= 2) { task.modelOverride = 'claude-opus-4-6'; }`. (2) Same fix in requeue(): before the existing prompt mutation, add `if (!task._originalPrompt) { task._originalPrompt = task.prompt; }`, replace the prompt line to rebuild from task._originalPrompt, and after `task.retryCount += 1` add `if (task.retryCount >= 2) { task.modelOverride = 'claude-opus-4-6'; }`. (3) In loop(), replace the single-ID dependency check block with array-aware logic: `const depIds = Array.isArray(task.dependsOn) ? task.dependsOn : [task.dependsOn]; let anyFailed = false, failedDepId: string|undefined, failedDepStatus: string|undefined, allSuccess = true; for (const depId of depIds) { const dep = this.tasks.get(depId) ?? this.store.get(depId) ?? undefined; if (!dep || ['failed','timeout','cancelled'].includes(dep.status)) { anyFailed = true; failedDepId = depId; failedDepStatus = dep?.status ?? 'missing'; break; } if (dep.status !== 'success') allSuccess = false; }` then fail-fast if anyFailed, re-queue if !allSuccess. (4) After `const mergeResult = await this.pool.release(...)`, add: `if (shouldMerge && mergeResult.merged) { for (const w of this.pool.getActiveWorkers(workerName)) { this.pool.rebaseOnMain(w).catch((err: unknown) => { log('warn','staged rebase failed',{worker:w,error:String(err)}); }); } }`. Also update submit() opts signature: change `dependsOn?: string` to `dependsOn?: string | string[]`. Run `npx tsc --noEmit`. Commit: `git add -A && git commit -m \"feat(scheduler): fix prompt accumulation, model escalation, array dependsOn, staged rebase\"`"
+      ]
+    },
+    {
+      "waveIndex": 4,
+      "tasks": [
+        "Modify src/__tests__/worktree-pool.test.ts only. Append two describe blocks at end of file. Block 1 'WorktreePool.getActiveWorkers': (a) test returns [] when no workers busy — init pool, call getActiveWorkers(), assert empty; (b) test returns both acquired worker names — acquire two workers, assert getActiveWorkers().length===2 and includes both names; (c) test excludes named worker — acquire two, call getActiveWorkers(w1.name), assert length===1 and result[0]===w2.name. Block 2 'WorktreePool.rebaseOnMain': (a) test returns false for unknown name — init pool, call rebaseOnMain('nonexistent'), assert false; (b) test returns true when up-to-date — acquire worker, call rebaseOnMain(worker.name), assert true; (c) test returns true after rebasing onto new main commits — acquire w0, write a file in w0.path, git add+commit in w0's worktree; acquire w1, write a different file in w1.path, git add+commit in w1's worktree, capture HEAD sha, call `git update-ref refs/heads/main <sha>` in repoPath to advance main; then call rebaseOnMain(w0.name) and assert true. Each test uses makeTempRepo() and cleanup() in finally. Run `node --import tsx --test src/__tests__/worktree-pool.test.ts`. Commit: `git add -A && git commit -m \"test(worktree-pool): getActiveWorkers and rebaseOnMain coverage\"`",
+        "Modify src/__tests__/scheduler.test.ts only. (1) Update makePool() to add two stubs: `getActiveWorkers: (_exclude?: string) => [] as string[]` and `rebaseOnMain: async (_name: string) => true`. (2) Append three describe blocks. 'Scheduler retry — prompt accumulation fix': (a) test that on 3 attempts (2 failures then success), each retry prompt contains exactly one '## Previous Attempt Failed' section — use regex match count; (b) test that task._originalPrompt equals the original submitted prompt string after first retry. 'Scheduler retry — model escalation': test that across 3 failed attempts (maxRetries:2), modelOverride captured at attempt index 0 and 1 is undefined, and at index 2 is 'claude-opus-4-6'. 'Scheduler dependency DAG — array dependsOn': (a) test task with dependsOn:[dep1.id,dep2.id] succeeds only after both deps complete, using completion order array to verify ordering; (b) test task fails immediately with error referencing the failed dep ID when one dep in the array fails; (c) backward-compat test: string dependsOn (not array) still works without errors. Use makeStore() and inline runner mocks with setTimeout delays. Run `node --import tsx --test src/__tests__/scheduler.test.ts` then `node --import tsx --test src/__tests__/*.test.ts`. Commit: `git add -A && git commit -m \"test(scheduler): prompt accumulation fix, model escalation, array dependsOn coverage\"`"
+      ]
+    }
+  ],
+  "totalTasks": 7
+}
\ No newline at end of file
diff --git a/AGENTS.md b/AGENTS.md
new file mode 100644
index 0000000..e69a9e6
--- /dev/null
+++ b/AGENTS.md
@@ -0,0 +1,23 @@
+# Repository Guidelines
+
+## Project Structure & Module Organization
+`src/` contains the TypeScript application code. Core runtime modules include `scheduler.ts`, `agent-runner.ts`, `store.ts`, `server.ts`, and the CLI entrypoints `index.ts` and `cli.ts`. Tests live in `src/__tests__/` and follow the source module names, for example `src/__tests__/scheduler.test.ts`. The web dashboard is a single static file at `src/web/index.html`; built output goes to `dist/`. Longer-form design and API docs live in `docs/`, and `ARCHITECTURE.md` explains the dependency flow between modules. Runtime artifacts such as `.cc-manager.db` and `.worktrees/` should not be treated as source.
+
+## Build, Test, and Development Commands
+Use Node.js 20+.
+
+- `npm install`: install dependencies and enable the repo’s git hooks via `prepare`.
+- `npm run dev`: run the app from source with `tsx`.
+- `npm run build`: compile TypeScript to `dist/` and copy the web UI asset.
+- `npm test`: run the Node test runner against `src/__tests__/*.test.ts`.
+- `npx tsc --noEmit`: run the strict type check used by CI and the pre-commit hook.
+- `npm run start -- --repo /path/to/repo`: run the built server locally.
+
+## Coding Style & Naming Conventions
+Follow `.editorconfig`: UTF-8, LF, and 2-space indentation. Keep source in TypeScript under `src/`; do not add plain `.js` source files there. Use Node ESM import paths with explicit `.js` extensions, for example `import { Store } from './store.js';`. Match existing file naming: kebab-case module files and `*.test.ts` for tests. Prefer explicit types and keep `strict`-mode compatibility. For the dashboard, keep `src/web/index.html` framework-free and self-contained.
+
+## Testing Guidelines
+Add or update targeted tests in `src/__tests__/` whenever behavior changes. Keep test filenames aligned with the module under test and cover both success and failure paths for scheduler, store, server, or worktree behavior. Before opening a PR, run `npx tsc --noEmit`, `npm test`, and `npm run build` if your change affects runtime packaging.
+
+## Commit & Pull Request Guidelines
+Recent history uses Conventional Commits, usually with a scope: `feat(scheduler): ...`, `fix(pipeline): ...`, `docs: ...`. Keep commits focused and descriptive. PRs should answer: what changed, why it changed, and how to test it. Follow `.github/pull_request_template.md`: confirm tests pass, types compile, `console.log` calls are removed, and docs are updated when needed.
diff --git a/CLAUDE.md b/CLAUDE.md
index 92542a4..cfe87f7 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -13,6 +13,10 @@ Multi-agent orchestrator that runs parallel Claude Code agents in git worktrees.
 - **src/worktree-pool.ts** — Git worktree lifecycle, parallel init, merge
 - **src/store.ts** — SQLite persistence (better-sqlite3, WAL mode)
 - **src/types.ts** — Shared TypeScript types
+- **src/pipeline.ts** — 5-stage autonomous pipeline (research→decompose→execute→verify→done)
+- **src/pipeline-types.ts** — Pipeline type definitions
+- **src/pipeline-store.ts** — Pipeline run persistence
+- **src/task-classifier.ts** — Task routing (quick/standard/deep → model/agent/contextProfile)
 - **src/logger.ts** — Structured JSON logger
 - **src/web/index.html** — Dashboard (vanilla HTML/JS, dark theme)
 
@@ -30,7 +34,7 @@ node dist/index.js --repo /path/to/repo --workers 5 --port 8080
 ```
 
 ```bash
-# Run tests (282 tests across 8 suites)
+# Run tests (372 tests across 10 suites)
 node --import tsx --test src/__tests__/*.test.ts
 ```
 
@@ -45,6 +49,14 @@ node --import tsx --test src/__tests__/*.test.ts
 ## Agent Flywheel Strategy
 The cc-manager improves itself by running agents against its own codebase.
 
+### Current Status: NOT WORKING (v0.1.7)
+Two self-hosting runs (v0.1.5, v0.1.6) achieved only 43-50% commit rate. All "successful" runs required manual fixes. The flywheel loop does not yet produce reliable, mergeable code autonomously.
+
+**Root causes identified**:
+- Agents exit 0 without committing (fixed in v0.1.7: F1 empty commit detection)
+- Complex files (scheduler.ts 618 LOC) always fail multi-point integration
+- System prompt commit instruction too weak (fixed in v0.1.7: F2 CRITICAL warning)
+
 ### Proven Best Practices
 - **240s timeout** — sweet spot (120s = 80% failure, 180s = occasional timeout)
 - **One file per task** — prevents merge conflicts between concurrent agents
@@ -146,7 +158,7 @@ pending → running → success (branch merged to main)
 
 ## Repository
 - **GitHub**: `agent-next/cc-manager` (private)
-- **Version**: v0.1.0
+- **Version**: v0.1.7
 
 ## Security Notes
 - **No authentication**: cc-manager has no auth. It is a local dev tool — do NOT expose to the public internet.
diff --git a/TODO.md b/TODO.md
new file mode 100644
index 0000000..70e1569
--- /dev/null
+++ b/TODO.md
@@ -0,0 +1,190 @@
+# TODO
+
+Single coordination backlog for multi-agent work. This file is the execution queue for the current codebase as of 2026-03-05.
+
+## Source of Truth
+
+- Prefer code over older roadmap claims.
+- Primary planning refs: `docs/plans/2026-03-05-v0.1.7-plan.md`, `docs/plans/2026-03-05-v0.2-implementation-plan.md`, `docs/ROADMAP.md`.
+- Latest review findings elevated several correctness and safety bugs above the previous roadmap work.
+- This backlog is cumulative: earlier roadmap items stay here if they are still real todos.
+
+## Backlog Continuity
+
+The earlier TODO was not discarded; its still-valid items were merged into the priority queue below.
+
+- Previous `T1 Failure diagnoser core` -> `P2-A3`
+- Previous `T2 Task classifier v2` -> `P2-A5`
+- Previous `T3 Docs sync` -> `P3-D2`
+- Previous `T4 Pipeline/API docs cleanup` -> `P3-D3`
+- Previous `T5 Claude resume support` -> `P2-A6`
+- Previous `T6 Structured review output` -> `P2-A7`
+- Previous `T7 Codex profile/config management` -> `P2-A8`
+- Previous `T8 Pricing/cost table refresh` -> `P2-A9`
+- Previous `T9 Wire failure diagnoser into retry flow` -> `P2-A4`
+- Previous `T10 Enhanced verification gate` -> `P4-A11`
+- Previous `T11 Import-graph wave validation` -> `P4-A10`
+- Previous `T12 Smart dead-loop detection` -> `P4-A12`
+- Previous `T13 Budget-aware model downgrade` -> `P4-A13`
+- Previous `T14 Agent self-evolution/version monitoring` -> `P4-A14`
+- Previous `T15 Dashboard v2` -> `P4-D4`
+
+## Coordination Rules
+
+- Each agent claims exactly one task.
+- Do not edit files owned by another active task.
+- Hot-file tasks must be serialized by lane.
+- Every code task must add or update narrow tests.
+- Update this file when claiming, blocking, or completing a task.
+
+Claim format:
+
+```md
+- [ ] P0-A Task name
+  owner: agent-name
+  status: in_progress
+```
+
+## Hot-File Lanes
+
+Use these lanes to avoid merge collisions.
+
+- Lane S: `src/scheduler.ts`, `src/pipeline.ts`
+- Lane A: `src/agent-runner.ts`, `src/types.ts`, `src/store.ts`
+- Lane V: `src/server.ts`
+- Lane W: `src/worktree-pool.ts`
+- Lane D: docs and packaging files
+
+## P0: Correctness And Safety
+
+These are blocking issues and should be addressed before new capability work.
+
+- [ ] P0-S1 Review rejection / merge conflict must not report success
+  lane: S
+  scope: ensure review rejection and merge conflict paths end in a non-success terminal status and correct API events
+  files: `src/scheduler.ts`, related tests
+  done when: a task blocked from merge cannot remain `success`
+
+- [ ] P0-S2 Pipeline cancel must stop running tasks
+  lane: S
+  scope: cancellation must stop already-running pipeline tasks, not just pending ones
+  files: `src/pipeline.ts`, `src/scheduler.ts`, related tests
+  depends_on: none
+  done when: cancelled runs cannot keep mutating the repo or merge afterward
+
+- [ ] P0-S3 Isolate concurrent pipeline runs
+  lane: S
+  scope: remove shared `_lastDecompose` and shared `.cc-pipeline/tasks.json` state across runs
+  files: `src/pipeline.ts`, `src/pipeline-store.ts`, related tests
+  depends_on: none
+  done when: two pipeline runs can decompose and execute without overwriting each other
+
+- [ ] P0-V1 Harden webhook SSRF validation
+  lane: V
+  scope: replace string-based host blocking with stricter validation that rejects loopback aliases and local/private targets
+  files: `src/server.ts`, related tests
+  done when: localhost variants and local-address tricks are rejected
+
+- [ ] P0-A1 Fix advertised default runtime behavior
+  lane: A
+  scope: make `--timeout`, `--budget`, and `--model` apply consistently to normal tasks, or change API/startup behavior and docs to match reality
+  files: `src/index.ts`, `src/server.ts`, `src/scheduler.ts`, `src/agent-runner.ts`, docs/tests as needed
+  done when: startup defaults match actual runtime behavior for ordinary task submissions
+
+## P1: Data Integrity And Observability
+
+These are important and can mostly proceed in parallel by lane.
+
+- [ ] P1-A2 Task diff and review must use task-specific commit range
+  lane: A
+  scope: stop diffing only `HEAD~1..HEAD`; capture full task diff/review scope for multi-commit tasks
+  files: `src/agent-runner.ts`, `src/scheduler.ts`, related tests
+  done when: cross-agent review covers the full task change set
+
+- [ ] P1-V2 Diff endpoint must not depend on mutable worker state
+  lane: V
+  scope: return task-specific diffs after worker reuse, not current worktree contents
+  files: `src/server.ts`, `src/worktree-pool.ts`, `src/store.ts`, related tests
+  done when: `/api/tasks/:id/diff` is stable after worker reassignment
+
+- [ ] P1-V3 GET /api/tasks must include persisted history after restart
+  lane: V
+  scope: merge scheduler in-memory tasks with store-backed history or route directly through persisted data
+  files: `src/server.ts`, `src/scheduler.ts`, `src/store.ts`, related tests
+  done when: task history survives process restart in the list API
+
+- [ ] P1-D1 Lock down npm publish surface
+  lane: D
+  scope: prevent `.cc-pipeline/*`, `.cc-manager.db*`, and other local runtime artifacts from shipping in npm packages
+  files: `.npmignore`, `package.json`
+  done when: `npm pack --dry-run` includes only intended publish artifacts
+
+## P2: Agent Quality Work
+
+Start these after P0 is merged. Serialize within Lane A.
+
+- [ ] P2-A3 Failure diagnoser core
+  lane: A
+  scope: add structured parsing for TypeScript/build failures
+  files: `src/failure-diagnoser.ts`, `src/__tests__/failure-diagnoser.test.ts`
+  done when: failures are categorized into actionable buckets such as missing import/export and dependency-order issues
+
+- [ ] P2-A4 Wire failure diagnoser into retry flow
+  lane: A
+  scope: inject structured diagnosis into retry prompts and task errors
+  files: `src/scheduler.ts`, `src/agent-runner.ts`, `src/failure-diagnoser.ts`, tests
+  depends_on: P2-A3
+  done when: retries include targeted failure context instead of generic error text
+
+- [ ] P2-A5 Task classifier v2
+  lane: A
+  scope: enrich classification beyond `quick|standard|deep`
+  files: `src/task-classifier.ts`, `src/__tests__/task-classifier.test.ts`
+  done when: routing metadata supports future agent/model/context decisions without breaking callers
+
+- [ ] P2-A6 Claude resume support
+  lane: A
+  scope: capture session identifiers and reuse them on retry
+  files: `src/agent-runner.ts`, `src/types.ts`, `src/store.ts`, related tests
+  done when: retry can continue prior session context instead of always starting cold
+
+- [ ] P2-A7 Structured review output
+  lane: A
+  scope: replace brittle review parsing with schema-shaped output
+  files: `src/agent-runner.ts`, related tests
+  done when: review approval, score, and issues are parsed deterministically
+
+- [ ] P2-A8 Codex profile/config management
+  lane: A
+  scope: generate or validate `~/.codex/config.toml` profiles for default and wide-context execution
+  files: `src/agent-runner.ts`, related tests, docs if needed
+  done when: Codex routing does not rely on undocumented local manual setup
+
+- [ ] P2-A9 Pricing and cost table refresh
+  lane: A
+  scope: ensure supported model rates are current and covered by tests
+  files: `src/agent-runner.ts`, tests
+  done when: supported Claude and Codex model rates are verified in tests
+
+## P3: Docs And Roadmap Cleanup
+
+- [ ] P3-D2 Sync roadmap docs with shipped code
+  lane: D
+  scope: update docs that still describe pipeline, DAG, or staged rebase as missing
+  files: `docs/ROADMAP.md`, `docs/GAP-ANALYSIS.md`, optionally `docs/STRATEGY.md`
+  done when: roadmap docs match the current implementation
+
+- [ ] P3-D3 Document pipeline and approval flow
+  lane: D
+  scope: document current pipeline endpoints, approval flow, and operator workflow
+  files: `README.md`, `docs/API.md`, `docs/OPERATIONS.md`
+  done when: contributors can discover pipeline behavior without reading source
+
+## Deferred
+
+- [ ] P4-A10 Import-graph wave validation
+- [ ] P4-A11 Enhanced verification gate
+- [ ] P4-A12 Smart dead-loop detection
+- [ ] P4-A13 Budget-aware model downgrade
+- [ ] P4-D4 Dashboard v2
+- [ ] P4-A14 Agent self-evolution/version monitoring
diff --git a/docs/3-agents-reference.md b/docs/3-agents-reference.md
new file mode 100644
index 0000000..bfd35c8
--- /dev/null
+++ b/docs/3-agents-reference.md
@@ -0,0 +1,195 @@
+# cc-manager: 3-Agent Reference (2026-03-05)
+
+cc-manager orchestrates 3 agents: Claude CLI, Claude Agent SDK, Codex CLI.
+Source: `src/agent-runner.ts`
+
+## Agent 1: Claude CLI (`agent: "claude"`) — Primary workhorse
+
+### Latest Core Features (Claude Code 2.1.x)
+- `--max-budget-usd <n>` — built-in budget cap per task
+- `--json-schema <schema>` — guaranteed structured output (no manual JSON parse)
+- `--fallback-model <model>` — auto-downgrade on overload (e.g. Opus → Sonnet on 429)
+- `--resume <session-id>` — continue previous session (retry without re-running from scratch)
+- `--max-turns <n>` — prevent agent loops (more precise than timeout)
+- `--append-system-prompt` — inject custom system instructions
+- `--output-format stream-json` — JSONL event stream for real-time monitoring
+- `--agents` — dynamic subagent definitions
+- `--worktree` — built-in worktree support (evaluate vs our worktree-pool)
+
+### What cc-manager uses today
+- `-p`, `--dangerously-skip-permissions`, `--output-format stream-json`, `--verbose`
+- `--model`, `--max-budget-usd`, `--append-system-prompt`
+- Code: `agent-runner.ts:428-502` (runClaude method)
+
+### Gaps (not using yet)
+- `--resume` (P0): retry wastes full token cost by re-running from scratch
+- `--fallback-model` (P1): Opus overload → direct fail instead of auto-downgrade
+- `--json-schema` (P1): review agent JSON parsing fails ~15-20%, falls back to heuristic
+- `--max-turns` (P2): only timeout guards against loops, not turn count
+
+## Agent 2: Claude Agent SDK (`agent: "claude-sdk"`) — Heavy tasks + hooks
+
+### Latest Core Features (SDK v0.2.69)
+- **V2 API**: `send()`/`stream()` replaces V1 `query()` async generator
+- `createSession()` / `resumeSession()` — persistent sessions across calls
+- **18 lifecycle hooks**: PreToolUse, PostToolUse, Stop, WorktreeCreate, etc.
+- Subagent definitions — SDK-native multi-agent (explore/code/review roles)
+- MCP server integration — mount tools (database, filesystem, etc.)
+- `maxBudgetUsd`, `maxTurns`, `permissionMode`, `systemPrompt` (append/preset)
+- `abortController` for graceful cancellation
+
+### What cc-manager uses today
+- V1 `query()` async generator (NOT V2)
+- `model`, `permissionMode: "bypassPermissions"`, `maxTurns: 50`
+- `maxBudgetUsd`, `systemPrompt` (append), `abortController`
+- `persistSession: false` (throwaway sessions)
+- Code: `agent-runner.ts:369-425` (runClaudeSDK method)
+
+### Gaps (not using yet)
+- V2 `send()`/`stream()` (P0): V1 query() has no session concept, can't resume
+- `createSession()`/`resumeSession()` (P0): retry = full re-run, not session continue
+- `persistSession: true` (P0): must enable to save session IDs
+- Lifecycle hooks (P1): no real-time cost monitoring, no danger tool interception
+- Subagent definitions (P2): not using SDK-native multi-agent roles
+
+## Agent 3: Codex CLI (`agent: "codex"`) — Cross-model retry + second opinion
+
+### Latest Core Features (Codex 0.104.0 + GPT-5.4)
+- GPT-5.4 model ($2.50/$15 per M tokens, SWE-bench 77.2%)
+- GPT-5.4 Thinking / GPT-5.4 Pro variants
+- `model_reasoning_effort` — low/medium/high/xhigh per task
+- Agent roles: worker/explorer/reviewer/monitor
+- `spawn_agents_on_csv` — batch multi-agent
+- `report_agent_job_result` — structured job completion
+- Config via `~/.codex/config.toml` with **profiles** support
+- `exec` mode with `--json` JSONL output
+
+### GPT-5.4 1M Context Window (IMPORTANT)
+- **NOT on by default** — must explicitly configure via config.toml profile
+- Default context: 272K. Experimental 1M support requires opt-in.
+- **Cost penalty beyond 272K**: 2x input rate, 1.5x output rate for FULL session
+- So GPT-5.4 pricing becomes $5.00/$22.50 per M tokens in 1M mode
+
+**Config profile for 1M context:**
+```toml
+# ~/.codex/config.toml
+[profiles.wide]
+model = "gpt-5.4"
+model_reasoning_effort = "medium"
+model_verbosity = "medium"
+model_context_window = 1050000
+model_auto_compact_token_limit = 900000
+```
+
+**When to use 1M context (wide profile):**
+- Large monorepo refactors
+- Cross-file debugging where context continuity matters
+- Keeping many long specs/design docs/logs in one session
+- Long-running agent sessions
+
+**When NOT to use (keep default 272K):**
+- Small bug fixes, quick edit/test loops
+- Tasks where rg/file reads/targeted search are enough
+- Any task that doesn't need full repo in context
+
+**Best practices:**
+- Keep default profile normal (272K), use `wide` profile only when needed
+- Even with 1M, don't paste giant blobs — let tools fetch on demand
+- Keep stable instructions in AGENTS.md, not repeated in chat
+- Start new session when task changes substantially
+- For API: pair with server-side compaction + prompt caching
+
+### What cc-manager uses today
+- `exec` mode, `--dangerously-bypass-approvals-and-sandbox`, `--json`, `--cd`
+- Model hardcoded to `o4-mini` when task model starts with "claude"
+- JSONL event parsing (item.completed, turn.completed)
+- Cost estimation hardcoded at o4-mini rates ($1.1/$4.4 per M)
+- Code: `agent-runner.ts:566-632` (runCodex method)
+
+### Gaps (not using yet)
+- GPT-5.4 (P0): hardcoded o4-mini, missing GPT-5.4's 77.2% SWE-bench capability
+- Model routing for Codex (P0): all tasks use o4-mini regardless of complexity
+- Config profiles (P0): no config.toml management — need default + wide profiles
+- `model_reasoning_effort` (P1): no effort tuning per task category
+- Cost table wrong (P1): hardcoded o4-mini prices; GPT-5.4 = $2.50/$15 (272K) or $5/$22.50 (1M)
+- 1M context routing (P1): deep tasks (monorepo refactor) should use wide profile, others should not
+- Agent roles (P2): not using worker/explorer/reviewer differentiation
+
+## Cross-Agent Architecture
+
+### Model Pricing Table (needs update in estimateCost)
+| Model | Input $/M | Output $/M | SWE-bench | Best for |
+|-------|----------|-----------|-----------|----------|
+| claude-haiku-4-5-20251001 | 0.80 | 4.00 | ~40% | Quick single-file fixes |
+| claude-sonnet-4-6 | 3.00 | 15.00 | ~65% | Standard 1-2 file tasks |
+| claude-opus-4-6 | 15.00 | 75.00 | 80.9% | Deep refactor, pipeline decompose |
+| gpt-5.4 (272K default) | 2.50 | 15.00 | 77.2% | Cross-model retry, cost-effective deep |
+| gpt-5.4 (1M wide mode) | 5.00 | 22.50 | 77.2% | Monorepo refactor, cross-file debug (2x/1.5x penalty) |
+| o4-mini | 1.10 | 4.40 | ~55% | Fast Codex tasks |
+
+### Current routing: task-classifier.ts
+- quick (<200 chars, <=1 file) → Haiku, 120s, $1
+- standard → Sonnet, 300s, $5
+- deep (refactor/redesign/3+ files) → Opus 4.6, 600s, $10
+- Classifier does NOT select agent, only Claude model
+
+### Current retry: scheduler.ts:544-559
+- Failed → swap agent (claude ↔ codex via pickFallbackAgent)
+- Error context injected into prompt
+- Bug: task.error cleared before retry (line 555), but error already in prompt (line 553)
+
+### Optimal Agent Selection Strategy (planned)
+| Scenario | Agent | Model | Why |
+|----------|-------|-------|-----|
+| Quick fix | Claude CLI | Haiku | Fastest, cheapest |
+| Standard coding | Claude CLI | Sonnet | Good balance |
+| Deep refactor | Claude SDK | Opus 4.6 | Hooks + session for control |
+| Cross-model retry | Codex CLI | GPT-5.4 | Different training bias |
+| Monorepo refactor | Codex CLI | GPT-5.4 (wide 1M) | Full repo context needed |
+| Code review | Claude CLI + --json-schema | Sonnet | Structured output |
+| Pipeline decompose | Claude SDK | Opus 4.6 | Codebase understanding |
+
+### Implementation Priority
+1. Phase 1 (quick wins, ~60 LOC): Fix Codex model routing, complete pricing table, add --fallback-model, add --max-turns, create codex config.toml profiles
+2. Phase 2 (session resume, ~120 LOC): Add sessionId to Task, CLI --resume on retry, SDK V2 upgrade, --json-schema for review
+3. Phase 3 (smart routing, ~150 LOC): Classifier outputs agent+model+profile combo, error-type-driven retry, SDK lifecycle hooks
+
+## Self-Evolution: Agent Version Monitor
+
+Core idea: cc-manager should **auto-detect upstream agent updates** and **intelligently upgrade its own integration** — not just pin versions, but adapt to new capabilities as they ship. This is a pillar of self-evolution.
+
+### What to Monitor
+| Source | Method | What changes |
+|--------|--------|-------------|
+| Claude CLI | `claude --version` + changelog RSS/GitHub releases | New flags, output format changes, model additions |
+| Claude Agent SDK | `npm view @anthropic-ai/claude-agent-sdk version` + CHANGELOG.md | API breaking changes (V1→V2), new hooks, new options |
+| Codex CLI | `codex --version` + GitHub releases | New models (GPT-5.4→next), new exec flags, role changes |
+
+### Monitor → Detect → Adapt Pipeline
+1. **Version Check** (periodic or on startup): compare installed vs latest
+2. **Changelog Parse**: extract new flags/features/breaking changes from release notes
+3. **Capability Mapping**: match new features to cc-manager gaps (e.g. new `--resume` flag → enable session retry)
+4. **Self-Upgrade Plan**: generate upgrade tasks (which files to change, what to add)
+5. **Auto-PR or Alert**: either auto-implement via pipeline or alert human for review
+
+### Concrete Triggers
+- New CLI flag detected → update `runClaude()`/`runCodex()` args builder
+- New model released → update `estimateCost()` pricing table + `task-classifier.ts` routing
+- SDK API change (V1→V2) → flag for manual upgrade (breaking change)
+- New agent role/capability → update `pickReviewAgent()`, `pickFallbackAgent()` logic
+- Deprecation notice → schedule migration before removal
+
+### Implementation Sketch
+- `src/agent-monitor.ts` — version check + changelog fetch + diff
+- Store last-known versions in SQLite (`agent_versions` table)
+- On version bump: parse changelog, emit `agent_updated` event
+- Pipeline can auto-generate upgrade tasks from changelog diff
+- Startup log: "Claude CLI 2.1.72 (was 2.1.69) — 3 new flags available"
+
+### Self-Evolution Loop
+```
+monitor versions → detect new features → map to gaps →
+generate upgrade tasks → execute via pipeline → verify TSC+tests →
+merge → cc-manager now uses latest capabilities → repeat
+```
+This closes the loop: cc-manager improves itself by consuming the very agents it orchestrates.
diff --git a/docs/BUILD-VS-BORROW.md b/docs/BUILD-VS-BORROW.md
new file mode 100644
index 0000000..5f239b8
--- /dev/null
+++ b/docs/BUILD-VS-BORROW.md
@@ -0,0 +1,228 @@
+# cc-manager: Build vs Borrow Strategy
+
+> "We didn't build Claude Code. We orchestrate it.
+> Same logic: don't build components. Assemble the best ones."
+
+---
+
+## What to BORROW (proven by others)
+
+### From Composio/agent-orchestrator (3.7K stars)
+
+**1. JSONL Event Monitoring** — DON'T parse stdout
+```
+Claude Code writes structured JSONL events to session files.
+Every user message, assistant response, tool execution, turn completion.
+Composio reads these directly instead of scraping terminal output.
+```
+- Source: `agent-claude-code` plugin reads `~/.claude/projects/*/sessions/*.jsonl`
+- We should: Read the same JSONL files. No stdout parsing. No self-reporting.
+- Effort: ~100 LOC to read and parse CC session events
+
+**2. 8-Slot Plugin Architecture** — proven abstraction boundaries
+```
+Runtime:   tmux | docker | k8s | process
+Agent:     claude-code | codex | aider | opencode
+Workspace: worktree | clone
+Tracker:   github | linear
+SCM:       github
+Notifier:  desktop | slack | webhook
+Terminal:  iterm2 | web
+Lifecycle: core
+```
+- We already have plugins/types.ts and registry.ts
+- Borrow: their slot categorization. Ours lumps too many concerns together.
+- Action: Refactor our plugin interface to match these 8 categories
+
+**3. CI Auto-Fix Loop** — their killer feature
+```
+Agent creates PR → CI fails → orchestrator injects CI logs back into agent session
+→ agent fixes → CI passes → merge
+```
+- We don't have this at all. Tasks just "fail" at TSC gate.
+- Borrow: the pattern of feeding failure output back as context for retry
+- This alone would have fixed our 0% success rate today
+
+**4. Review Comment Routing**
+```
+Reviewer leaves comment on PR → orchestrator routes to agent → agent addresses it
+```
+- We have C3 (PR reviewer) but not the feedback loop back to the original agent
+
+### From claude-squad (6.2K stars)
+
+**5. tmux Session Management** — battle-tested
+```go
+// claude-squad creates tmux sessions per agent, tracks state
+cmd/session.go → tmux new-session -d -s "agent-0" -x 200 -y 50
+```
+- Our current approach: `spawn("claude", ["-p", prompt])` — basic child_process
+- Borrow: tmux as the runtime layer. More robust, survives crashes, inspectable.
+- Bonus: user can `tmux attach -t agent-0` to watch any agent live
+
+**6. One-letter CLI** — `cs` (claude-squad)
+- We have `cc-m` (3 chars) vs `cs` (2 chars)
+- Not critical, but shows their focus on developer ergonomics
+
+### From vibe-kanban (22K stars)
+
+**7. Kanban UI Concept** — why they have 22K stars
+- People want to SEE their agent fleet
+- Our dashboard is basic SSE + task list
+- Borrow: the mental model of kanban columns (Backlog → In Progress → Review → Done)
+- Don't build a full React app; enhance our existing HTML dashboard with kanban lanes
+
+**8. "Each workspace gives an agent a branch, a terminal, and a dev server"**
+- The three-piece bundle: branch + terminal + dev server per agent
+- We have branch + terminal. Missing: per-agent dev server for testing
+
+### From symphony (OpenAI, 4.2K stars)
+
+**9. WORKFLOW.md Spec** — harness engineering
+```
+Symphony requires repos to have WORKFLOW.md defining:
+- How to plan
+- How to execute
+- How to verify
+```
+- We already have C6 (workflow-loader). Good.
+- Borrow: their specific WORKFLOW.md structure and make it a first-class citizen
+
+**10. "Walkthrough Video" as Proof**
+- Symphony agents produce walkthrough videos showing their changes work
+- Wild idea but powerful for review — PR includes a video of the change working
+
+### From ccpm (7.6K stars)
+
+**11. PRD → Epic → Task Decomposition Chain**
+- ccpm structures work as: PRD → Epic → Task → GitHub Issue → Agent
+- We have C8 (orchestrator decomposition) but no PRD/Epic layer
+- Borrow: the multi-level decomposition concept for complex projects
+
+### From metabot (96 stars)
+
+**12. IM Bridge for Mobile Access**
+- Control agent fleet from Telegram/Feishu on your phone
+- `cc-m ls` but from your phone while commuting
+- Low effort via Telegram Bot API, high user delight
+
+### From dagger/container-use (3.6K stars)
+
+**13. Container Isolation Option**
+- Worktrees share the host filesystem. Containers are fully sandboxed.
+- For high-risk tasks (deleting files, running untrusted code): container > worktree
+- Borrow: offer both worktree (fast, default) and container (safe, opt-in)
+
+---
+
+## What to BUILD (nobody has this)
+
+### 1. Wave Planner + Staged Merging ← OUR MOAT
+
+**Nobody does this. Confirmed by web search — zero results.**
+
+```
+Current (everyone):
+  Dispatch all tasks → run in parallel → merge at end → conflicts/TSC fails
+
+cc-manager (our innovation):
+  Analyze deps → split into waves → run wave → merge → rebase → next wave
+```
+
+This is the ONE thing that makes us better than Composio.
+Composio retries on CI failure (reactive). We prevent failure (proactive).
+
+### 2. Failure Diagnosis Engine
+
+Parse TSC/test errors → identify root cause → auto-resolve:
+- Missing type → find which task creates it → merge that first
+- Import error → fix import path
+- Test failure → spawn targeted fix agent
+
+Composio does "inject CI logs back into agent" (reactive).
+We do "parse error, identify root cause, fix environment" (proactive).
+
+### 3. Success Rate Tracking as First-Class Metric
+
+No orchestrator shows you: "Your fleet has 87% success rate, up from 72% last week."
+Make this the hero number on the dashboard.
+
+---
+
+## Assembly Plan
+
+```
+Phase 1: Borrow the basics (make it work)
+  ├── #3 CI auto-fix loop (from Composio pattern)
+  ├── #1 JSONL event monitoring (from Composio)
+  ├── #5 tmux runtime (from claude-squad)
+  └── #9 WORKFLOW.md as first-class (from symphony)
+
+Phase 2: Build our moat (make it smart)
+  ├── Wave Planner (OURS — nobody has this)
+  ├── Staged Merging (OURS — nobody has this)
+  └── Failure Diagnosis Engine (OURS — proactive vs reactive)
+
+Phase 3: Borrow the polish (make it beautiful)
+  ├── #7 Kanban-style dashboard (from vibe-kanban concept)
+  ├── #12 Telegram bot (from metabot)
+  ├── #2 8-slot plugin refactor (from Composio)
+  └── #13 Container isolation option (from dagger)
+
+Phase 4: Borrow the scale (make it enterprise)
+  ├── #11 PRD→Epic→Task chain (from ccpm)
+  ├── #4 Review comment routing (from Composio)
+  └── Success rate analytics dashboard
+```
+
+---
+
+## The Composable Architecture
+
+```
+┌─────────────────────────────────────────────────────────┐
+│                    cc-manager v0.2                       │
+│                                                         │
+│  ┌─────────────┐  ┌─────────────┐  ┌────────────────┐ │
+│  │ Issue Source │  │ Wave Planner│  │ Failure Diag.  │ │
+│  │ (GitHub/     │  │ (OURS)      │  │ (OURS)         │ │
+│  │  Linear)     │  │ dep analysis│  │ TSC/test parse │ │
+│  │ #borrowed    │  │ topo sort   │  │ auto-resolve   │ │
+│  └──────┬──────┘  └──────┬──────┘  └───────┬────────┘ │
+│         │                │                  │          │
+│         ▼                ▼                  ▼          │
+│  ┌─────────────────────────────────────────────────┐   │
+│  │              Execution Engine                    │   │
+│  │                                                  │   │
+│  │  Runtime: tmux (#5 claude-squad)                │   │
+│  │  Workspace: worktree | container (#13 dagger)   │   │
+│  │  Monitoring: JSONL events (#1 Composio)         │   │
+│  │  Retry: CI log injection (#3 Composio)          │   │
+│  │  Merging: staged merge (OURS)                   │   │
+│  └─────────────────────────────────────────────────┘   │
+│         │                                              │
+│         ▼                                              │
+│  ┌─────────────────────────────────────────────────┐   │
+│  │              Interface Layer                     │   │
+│  │                                                  │   │
+│  │  CLI: cc-m (ours)                               │   │
+│  │  Dashboard: kanban lanes (#7 vibe-kanban)       │   │
+│  │  Mobile: Telegram bot (#12 metabot)             │   │
+│  │  API: REST + SSE (ours)                         │   │
+│  └─────────────────────────────────────────────────┘   │
+└─────────────────────────────────────────────────────────┘
+```
+
+---
+
+## Sources
+
+- [Composio blog: The Self-Improving AI System That Built Itself](https://composio.dev/blog/the-self-improving-ai-system-that-built-itself)
+- [Composio blog: Open-Sourcing Agent Orchestrator](https://pkarnal.com/blog/open-sourcing-agent-orchestrator)
+- [Running 20 AI Agents in Parallel](https://pkarnal.com/blog/parallel-ai-agents)
+- [ComposioHQ/agent-orchestrator](https://github.com/ComposioHQ/agent-orchestrator)
+- [smtg-ai/claude-squad](https://github.com/smtg-ai/claude-squad)
+- [BloopAI/vibe-kanban](https://github.com/BloopAI/vibe-kanban)
+- [openai/symphony](https://github.com/openai/symphony)
+- [dagger/container-use](https://github.com/dagger/container-use)
+- [xvirobotics/metabot](https://github.com/xvirobotics/metabot)
diff --git a/docs/COMPETITIVE-ANALYSIS.md b/docs/COMPETITIVE-ANALYSIS.md
new file mode 100644
index 0000000..102decd
--- /dev/null
+++ b/docs/COMPETITIVE-ANALYSIS.md
@@ -0,0 +1,186 @@
+# Coding Agent Orchestrator: Competitive Analysis
+
+**Date**: 2026-03-05
+**Category**: Tools that orchestrate existing coding agent CLIs (not frameworks for building agents from scratch)
+
+---
+
+## Market Map
+
+```
+                        Full Automation
+                             ▲
+                             │
+              ┌──────────────┼──────────────┐
+              │              │              │
+              │  agent-orch  │  cc-manager  │
+              │  (Composio)  │  (Agent Next)│
+              │              │              │
+              │    symphony  │   lalph      │
+              │    (OpenAI)  │              │
+   CLI-only ──┼──────────────┼──────────────┼── GUI-first
+              │              │              │
+              │ claude-squad │  vibe-kanban │
+              │    cmux      │  humanlayer  │
+              │    amux      │  emdash      │
+              │              │  parallel-   │
+              │              │    code      │
+              └──────────────┼──────────────┘
+                             │
+                             ▼
+                      Manual Control
+```
+
+---
+
+## Tier 1: Direct Competitors (Full Orchestrators)
+
+### 1. BloopAI/vibe-kanban — 22,439 stars
+- **URL**: https://github.com/BloopAI/vibe-kanban
+- **Agents**: 10+ (Claude Code, Copilot, Gemini CLI, Codex, Amp, Cursor, OpenCode, Droid, CCR, Qwen Code)
+- **Lang**: Rust (49.6%) + TypeScript (46.4%)
+- **Architecture**: Kanban board UI as task manager, each task in isolated git worktree. SQLx persistence.
+- **Isolation**: Git worktree, one branch per task
+- **Key differentiator**: Visual kanban is the core UX — drag tasks, assign to agents, view diffs, create PRs. Built-in preview browser.
+- **Weakness**: Manual task creation/assignment (no auto-dispatch), no budget control.
+- **vs cc-manager**: vibe-kanban is human-managed kanban; cc-manager is automated queue dispatch.
+
+### 2. humanlayer/humanlayer (CodeLayer) — 9,654 stars
+- **URL**: https://github.com/humanlayer/humanlayer
+- **Agents**: Claude Code primarily ("Superhuman for Claude Code")
+- **Lang**: TypeScript (59.2%) + Go (33.6%) + Docker Compose
+- **Architecture**: IDE-level experience. "MULTICLAUDE" for parallel execution. ACP (Agent Control Plane) as distributed scheduler.
+- **Isolation**: Git worktree + optional remote cloud workers
+- **Key differentiator**: "Advanced Context Engineering" for large codebases. Keyboard-first IDE replacement.
+- **Weakness**: Heavy, steep learning curve. Primarily Claude Code only.
+- **vs cc-manager**: humanlayer is a full IDE replacement; cc-manager is a lightweight CLI orchestrator.
+
+### 3. automazeio/ccpm — 7,558 stars
+- **URL**: https://github.com/automazeio/ccpm
+- **Agents**: Claude Code via `/pm:` commands
+- **Architecture**: CLAUDE.md spec + `.claude/` directory structure (PRDs, epics, tasks) + GitHub Issues as single source of truth.
+- **Isolation**: Git worktree, one branch per task
+- **Key differentiator**: Spec-driven workflow (PRD → epic → task → Issue → agent). Full traceability. Supports human+AI mixed collaboration.
+- **Weakness**: Requires manual PRD/epic creation. No budget control. No multi-agent type support.
+- **vs cc-manager**: ccpm is "requirements to execution" PM framework; cc-manager focuses on execution-layer orchestration.
+
+### 4. smtg-ai/claude-squad — 6,218 stars
+- **URL**: https://github.com/smtg-ai/claude-squad
+- **Agents**: Claude Code, Aider, Codex, Gemini, OpenCode, Amp
+- **Lang**: Go (87.9%)
+- **Architecture**: tmux session manager + git worktree isolation. TUI interface, keyboard-driven.
+- **Isolation**: Git worktree, one branch per session
+- **Key differentiator**: Pure TUI, Go, extremely lightweight. `-p` flag for any agent command. `--dangerously-skip-permissions` yolo mode.
+- **Weakness**: Manual-driven (user starts/manages each agent in TUI). No task queue, no budget, no auto-merge.
+- **vs cc-manager**: claude-squad is manual TUI multiplexer; cc-manager is automated queue orchestrator.
+
+### 5. openai/symphony — 4,232 stars
+- **URL**: https://github.com/openai/symphony
+- **Agents**: Codex primarily
+- **Lang**: Elixir reference implementation + spec docs
+- **Architecture**: Monitors Linear/work boards → auto-spawns agents → CI verification → safe PR landing.
+- **Key differentiator**: OpenAI official. Emphasizes "harness engineering" (codebase must adopt specific practices). More spec/protocol than turnkey tool.
+- **Weakness**: Requires team adoption of the spec. No budget control, no GUI.
+- **vs cc-manager**: symphony is spec + reference impl; cc-manager is ready-to-use tool.
+
+### 6. ComposioHQ/agent-orchestrator — 3,709 stars
+- **URL**: https://github.com/ComposioHQ/agent-orchestrator
+- **Agents**: Claude Code, Codex, Aider, OpenCode
+- **Lang**: TypeScript
+- **Architecture**: 8-slot plugin architecture. Runtimes (tmux/Docker/k8s), workspaces (worktree/clone), issue trackers (GitHub/Linear) are all pluggable. Reads Claude Code's structured JSONL event file for monitoring.
+- **Isolation**: Git worktree (default) or clone
+- **Task source**: GitHub Issues, Linear
+- **Key differentiator**:
+  - Auto-handles CI failures (injects failure logs back into agent session)
+  - Auto-addresses code review comments (routes to corresponding agent)
+  - Dashboard for 30 parallel agents
+  - Self-improvement loop: records performance metrics, adjusts strategies
+  - **Built itself**: 30 agents in parallel, 8 days, 40,000 LOC TypeScript, 84.6% CI success
+- **Weakness**: No budget control. More focused on CI/PR lifecycle than task queue management.
+- **vs cc-manager**: Closest full-feature competitor. Composio has more mature plugin system; cc-manager has budget control.
+
+---
+
+## Tier 2: Parallel Runners / TUI Tools
+
+| Project | Stars | Agents | Key Feature | Weakness |
+|---------|-------|--------|-------------|----------|
+| [manaflow-ai/cmux](https://github.com/manaflow-ai/cmux) | 4,184 | CC/OpenCode/Codex | macOS native, GPU-accelerated terminal, notification-driven | macOS only, no auto-dispatch |
+| [dagger/container-use](https://github.com/dagger/container-use) | 3,586 | Any MCP agent | **Container isolation** (not worktree), Dagger engine, cross-env consistency | Runtime layer only, no task queue |
+| [stravu/crystal](https://github.com/stravu/crystal) | 2,968 | Codex/CC | Desktop app | **Deprecated** Feb 2026, replaced by Nimbalyst |
+| [generalaction/emdash](https://github.com/generalaction/emdash) | 2,372 | **22 agents** (most) | YC W26, Linear/GitHub/Jira import, SSH/SFTP remote | Early stage, unclear auto-merge |
+| [subsy/ralph-tui](https://github.com/subsy/ralph-tui) | 2,047 | CC/OpenCode/Factory/Gemini/Codex | Autonomous serial loop, PRD+Beads task tracker | **Serial only** (one task at a time) |
+| [coder/mux](https://github.com/coder/mux) | 1,294 | Multi-LLM (API, not CLI) | SSH remote execution, cost tracking | Calls APIs directly, not CLI wrappers |
+| [johannesjo/parallel-code](https://github.com/johannesjo/parallel-code) | 313 | CC/Codex/Gemini | Electron GUI, mobile QR code monitoring | No task queue, no auto-merge |
+
+---
+
+## Tier 3: Niche / Special Purpose
+
+| Project | Stars | Unique Angle |
+|---------|-------|-------------|
+| [xvirobotics/metabot](https://github.com/xvirobotics/metabot) | 96 | **IM bridge** — control CC teams via Feishu/Telegram. Shared MetaMemory (SQLite). Agent Bus REST API for inter-agent delegation. Cron scheduling. |
+| [tim-smart/lalph](https://github.com/tim-smart/lalph) | 92 | **Architecture closest to cc-manager**: issue-driven, label-based routing, auto-merge, task dependencies, git worktree concurrency. |
+| [dsifry/metaswarm](https://github.com/dsifry/metaswarm) | 95 | 18 agents collaboration framework |
+| [nyldn/claude-octopus](https://github.com/nyldn/claude-octopus) | 1,016 | Multi-agent consensus mechanism |
+| [andyrewlee/amux](https://github.com/andyrewlee/amux) | 42 | Minimal TUI multiplexer |
+
+---
+
+## Tier 4: Commercial / Closed Source
+
+| Product | Key Feature |
+|---------|-------------|
+| **GitHub Agent HQ** | GitHub-native. Assign same issue to Copilot+Claude+Codex simultaneously, compare results. Enterprise audit trail. |
+| **Cognition Devin** (MultiDevin) | Multiple Devin VMs in parallel. Closed SaaS. |
+| **Factory** | Enterprise agent fleet management. SOC2 compliant. |
+
+---
+
+## Feature Comparison Matrix
+
+| Feature | cc-manager | agent-orch (Composio) | vibe-kanban | claude-squad | symphony | ccpm |
+|---------|-----------|----------------------|-------------|--------------|----------|------|
+| **Budget cap ($$$)** | **YES** | No | No | No | No | No |
+| Auto task dispatch | **YES** | **YES** | Manual | Manual | **YES** | Manual |
+| Auto-merge pipeline | **YES** | **YES** (CI-aware) | PR creation | Manual | **YES** | Manual |
+| Cross-agent review | **YES** (C3) | **YES** | No | No | No | No |
+| Plugin architecture | Planned (v0.1.4) | **YES** (8-slot) | No | No | Spec | No |
+| Self-evolution | Planned (v0.1.4) | **YES** | No | No | No | No |
+| Issue tracker integration | **YES** (C1) | **YES** | No | No | **YES** (Linear) | **YES** (GitHub) |
+| State machine | **YES** (C5) | **YES** | No | No | No | No |
+| Agent memory / learning | **YES** (memory.ts) | **YES** | No | No | No | No |
+| GUI / Dashboard | Basic web | Dashboard | **Kanban** | TUI | No | No |
+| One-line start | `cc-manager --repo .` | Config required | Config required | `cs` | Config required | Config required |
+| Multi-agent types | CC/CX/any CLI | CC/CX/Aider/OpenCode | 10+ agents | 6 agents | CX | CC only |
+| Worktree isolation | **YES** | **YES** | **YES** | **YES** | **YES** | **YES** |
+| Container isolation | No | Docker/k8s option | No | No | No | No |
+| SSE real-time events | **YES** | **YES** | No | Terminal | No | No |
+| Cost tracking | **YES** | No | No | No | No | No |
+| Tests | 367 | Unknown | Unknown | Unknown | Unknown | Unknown |
+
+---
+
+## Star Count Rankings (verified 2026-03-05)
+
+| # | Project | Stars | Category |
+|---|---------|-------|----------|
+| 1 | BloopAI/vibe-kanban | 22,439 | Kanban GUI |
+| 2 | humanlayer/humanlayer | 9,654 | IDE + Orchestrator |
+| 3 | automazeio/ccpm | 7,558 | PM Protocol |
+| 4 | smtg-ai/claude-squad | 6,218 | TUI Multiplexer |
+| 5 | openai/symphony | 4,232 | Spec + Ref Impl |
+| 6 | manaflow-ai/cmux | 4,184 | macOS Terminal |
+| 7 | ComposioHQ/agent-orchestrator | 3,709 | Full Orchestrator |
+| 8 | dagger/container-use | 3,586 | Container Runtime |
+| 9 | stravu/crystal | 2,968 | Desktop (deprecated) |
+| 10 | generalaction/emdash | 2,372 | Desktop, 22 agents |
+| 11 | subsy/ralph-tui | 2,047 | Serial Loop |
+| 12 | coder/mux | 1,294 | Multi-LLM Desktop |
+| 13 | nyldn/claude-octopus | 1,016 | Consensus |
+| 14 | johannesjo/parallel-code | 313 | Electron GUI |
+| 15 | xvirobotics/metabot | 96 | IM Bridge (Feishu/TG) |
+| 16 | dsifry/metaswarm | 95 | 18-agent collab |
+| 17 | tim-smart/lalph | 92 | Issue-driven (closest to cc-manager) |
+| 18 | andyrewlee/amux | 42 | Minimal TUI |
+| — | **agent-next/cc-manager** | **~50** | **Queue + Budget Orchestrator** |
diff --git a/docs/CONFIGURATION.md b/docs/CONFIGURATION.md
index 9a28e64..ebb3f7b 100644
--- a/docs/CONFIGURATION.md
+++ b/docs/CONFIGURATION.md
@@ -110,10 +110,10 @@ Claude model identifier passed to every agent session.
 |---|---|
 | **Default** | `claude-sonnet-4-6` |
 | **Type** | string |
-| **Valid values** | Any supported Claude model ID (e.g. `claude-opus-4-5`, `claude-sonnet-4-6`) |
+| **Valid values** | Any supported Claude model ID (e.g. `claude-opus-4-6`, `claude-sonnet-4-6`) |
 
 ```bash
-cc-manager --repo . --model claude-opus-4-5
+cc-manager --repo . --model claude-opus-4-6
 ```
 
 ---
diff --git a/docs/GAP-ANALYSIS.md b/docs/GAP-ANALYSIS.md
new file mode 100644
index 0000000..73305f4
--- /dev/null
+++ b/docs/GAP-ANALYSIS.md
@@ -0,0 +1,128 @@
+# cc-manager: Gap Analysis & Action Plan
+
+> Simple but powerful. Fix what's broken, connect what's disconnected, add what's missing.
+
+---
+
+## 1. Self-Assessment
+
+### What works
+- Worktree pool (create/acquire/release/merge)
+- SQLite persistence (WAL, 24-col tasks table)
+- SSE real-time events
+- Priority queue with event-driven dispatch
+- TSC build gate
+- Multi-agent (Claude CLI/SDK, Codex, any CLI)
+- Budget control
+- Web dashboard + CLI (cc-m)
+
+### What's dead code (~40%)
+- `state-machine.ts` — FSM never called by Scheduler
+- `router.ts` — smart routing never called
+- `memory.ts` — execution memory never called
+- `workpad.ts` — progress files never written
+- `store.claimTask()` — atomic claim never used
+- `orchestrator.ts` — DAG decomposition has no API endpoint
+
+### What's broken
+- `listTasks()` reads only memory, not SQLite → empty after restart
+- Rate limit hardcoded to single key → effectively disabled
+- Two conflicting `AgentPlugin` interfaces
+- Pool lock is 10ms spin → should be Promise queue
+
+---
+
+## 2. Gap vs Competitors
+
+### Critical (blocks success rate)
+
+| Gap | What competitors do | Effort |
+|-----|--------------------:|-------:|
+| No staged merging | Gas Town Refinery: serial merge queue + CI bisect | ~200 LOC |
+| No wave planning | Gas Town Convoy (manual), nobody auto-analyzes | ~300 LOC |
+| No CI feedback loop | Composio: inject CI errors → agent fixes → retry | ~100 LOC |
+| No failure diagnosis | Nobody (our moat): parse TSC error → fix env → retry | ~200 LOC |
+
+### Important (blocks robustness)
+
+| Gap | What competitors do | Effort |
+|-----|--------------------:|-------:|
+| No stall timeout | lalph: output activity, not wall-clock | ~30 LOC |
+| No JSONL monitoring | Composio: read session JSONL directly | ~100 LOC |
+| No context recovery | Gas Town Handoff/Seance: checkpoint + resume | ~100 LOC |
+| No worktree pre-warm | emdash: reserve pool, instant claim | ~50 LOC |
+| Dead code not wired | Our own modules exist but aren't connected | ~100 LOC |
+
+### Nice-to-have (blocks adoption)
+
+| Gap | What competitors do | Effort |
+|-----|--------------------:|-------:|
+| No provider registry | emdash: declarative agent config | ~150 LOC |
+| No attempt model | vibe-kanban: multiple tries, compare diffs | ~100 LOC |
+| No auth | Everyone except simple tools | ~50 LOC |
+| No Telegram/IM | metabot: mobile monitoring | ~200 LOC |
+
+---
+
+## 3. Action Plan: 3 Sprints
+
+### Sprint 1: Wire + Core Loop (0% → 80%)
+
+**Wire dead code:**
+- Connect FSM to Scheduler (use `transition()` instead of raw string assignment)
+- Connect Router to dispatch (pick best agent per task)
+- Connect Memory to post-execution (record outcomes)
+- Add `/api/orchestrate` endpoint for Orchestrator
+- Fix `listTasks()` to merge memory + SQLite
+- Fix rate limit bug
+
+**Add core loop:**
+- `staged-merger.ts` — merge completed tasks immediately, rebase active worktrees
+- `wave-planner.ts` — analyze deps, topological sort into waves
+- CI feedback in `agent-runner.ts` — on TSC fail, inject errors as retry context
+- `failure-diagnoser.ts` — parse TSC errors, identify missing deps, auto-resolve
+
+### Sprint 2: Robustness (80% → 90%)
+
+- Stall timeout (replace wall-clock with output-activity)
+- JSONL monitor (read Claude session files)
+- Handoff protocol (checkpoint + resume)
+- Worktree pre-warming (reserve pool)
+- Promise-based pool lock (replace spin)
+
+### Sprint 3: Polish (90% → 95%)
+
+- Provider registry (declarative agent config)
+- Attempt model (multiple tries per task)
+- API auth (Bearer token)
+- Enhanced dashboard (kanban lanes)
+
+---
+
+## 4. Sprint 1 Scaffold
+
+### New files (4):
+
+```
+src/staged-merger.ts     — merge queue + rebase active worktrees
+src/wave-planner.ts      — dependency analysis + wave generation
+src/failure-diagnoser.ts — parse errors + identify root cause + suggest fix
+src/pipeline.ts          — connects everything: wave → dispatch → merge → diagnose
+```
+
+### Modified files (4):
+
+```
+src/scheduler.ts    — use FSM transitions, call Router, call Memory
+src/agent-runner.ts — CI feedback loop (inject TSC errors on retry)
+src/server.ts       — add /api/orchestrate, fix listTasks, fix rate limit
+src/index.ts        — wire Pipeline into startup
+```
+
+### Design principle:
+
+Each new module is a pure function or simple class with:
+- Clear input/output types
+- No hidden state
+- Testable in isolation
+- <200 LOC each
diff --git a/docs/IMPLEMENTATION-PLAN.md b/docs/IMPLEMENTATION-PLAN.md
new file mode 100644
index 0000000..98c235b
--- /dev/null
+++ b/docs/IMPLEMENTATION-PLAN.md
@@ -0,0 +1,406 @@
+# cc-manager v0.2: Implementation Plan
+
+> Focus on ours. Borrow good features from others.
+> Our moat: Wave Planning + Staged Merging. Nobody else has this.
+
+---
+
+## Current State (v0.1.0)
+
+- 6 modules, 3150 LOC, 367 tests passing
+- 0% auto-merge (TSC gate fails due to isolation paradox)
+- Basic child_process spawn, no CI feedback loop, no wave planning
+
+## Target State (v0.2.0)
+
+- 95%+ auto-merge success rate
+- Wave-based dependency-aware dispatch
+- CI failure → auto-fix loop
+- Borrowed best patterns from 18+ competitors
+
+---
+
+## Phase 1: Fix the Core Loop (0% → 80%)
+
+**Goal**: Tasks that run should actually merge.
+
+### 1.1 Staged Merging ← OUR MOAT (nobody has this)
+
+```
+Current:  dispatch all → run parallel → merge at end → all fail (TSC)
+Target:   dispatch wave → run parallel → merge completed → rebase active → next wave
+```
+
+**New file**: `src/staged-merger.ts` (~200 LOC)
+```typescript
+interface StagedMerger {
+  // After a task completes and passes TSC:
+  mergeToMain(worktreeId: string): Promise<MergeResult>
+  // After merge, rebase all active worktrees:
+  rebaseActive(activeWorktrees: string[]): Promise<RebaseResult[]>
+}
+```
+
+**Modify**: `src/scheduler.ts` — add merge-after-complete hook
+
+### 1.2 Wave Planner ← OUR MOAT (nobody has this)
+
+```
+Tasks: [create types.ts, use types.ts, modify scheduler.ts, add tests]
+  → Dependency analysis → DAG
+  → Wave 1: [create types.ts, modify scheduler.ts, add tests] (parallel)
+  → Wave 2: [use types.ts] (after types.ts merged)
+```
+
+**New file**: `src/wave-planner.ts` (~300 LOC)
+```typescript
+interface WavePlanner {
+  analyzeDeps(tasks: Task[]): DependencyGraph
+  planWaves(graph: DependencyGraph): Wave[]
+  // Each wave: max parallel tasks with no inter-dependencies
+}
+
+interface Wave {
+  id: number
+  tasks: Task[]
+  dependsOn: number[]  // previous wave IDs that must complete
+}
+```
+
+**How to analyze deps**: Parse task prompts for file references (imports, creates, modifies).
+Use Opus to identify which tasks create new types/exports and which consume them.
+
+### 1.3 Merge Queue with CI Bisect (borrowed from Gas Town's Refinery)
+
+Gas Town's Refinery is the only project with a real merge queue:
+```
+Multiple PRs ready → batch merge → run CI on tip
+  → CI passes: all merged
+  → CI fails: binary search to find which PR broke it → reject that one → retry rest
+```
+
+**Modify**: `src/staged-merger.ts` — add Refinery-style bisect on CI failure
+
+```typescript
+interface MergeQueue {
+  // Batch merge completed tasks
+  batchMerge(tasks: CompletedTask[]): Promise<MergeResult>
+  // On CI failure, binary search for the culprit
+  bisectFailure(tasks: CompletedTask[], ciError: string): Promise<Task>
+  // Retry without the culprit
+  retryWithout(culprit: Task): Promise<MergeResult>
+}
+```
+
+### 1.4 CI Auto-Fix Loop (borrowed from Composio)
+
+```
+Agent creates code → TSC fails → inject TSC errors back into agent → agent fixes → retry
+```
+
+**Modify**: `src/agent-runner.ts` — after TSC gate failure:
+1. Parse TSC error output
+2. Inject error context as continuation prompt
+3. Resume agent session (not restart from scratch)
+
+**Borrow from**: Composio's reaction engine pattern + Symphony's continuation turns
+
+### 1.5 Failure Diagnosis Engine ← OUR MOAT
+
+```
+TSC error: "Cannot find module './types.js'"
+  → Diagnosis: types.ts created by Task A, not yet merged
+  → Action: merge Task A first, rebase, retry
+```
+
+**New file**: `src/failure-diagnoser.ts` (~200 LOC)
+
+---
+
+## Phase 2: Borrow the Runtime (80% → 90%)
+
+### 2.1 JSONL Event Monitoring (from Composio)
+
+**Stop**: Parsing stdout/self-reporting
+**Start**: Read `~/.claude/projects/*/sessions/*.jsonl` directly
+
+```typescript
+// Composio reads these fields from JSONL:
+// - type: "user" | "assistant" | "tool_use" | "tool_result"
+// - timestamp, sessionId, content
+```
+
+**New file**: `src/jsonl-monitor.ts` (~100 LOC)
+- Watch session JSONL files with `fs.watch()`
+- Parse events: message, tool_use, turn_complete
+- Replace current stdout-based progress tracking
+
+### 2.2 Stall Timeout (from lalph)
+
+**Current**: Wall-clock timeout kills agent after N minutes
+**Better**: Track last output time, kill only if agent produces no output for M seconds
+
+```typescript
+// lalph pattern: race output stream vs stall timer
+// Every stdout line resets the stall timer
+// Agent is alive if producing output, even if slow
+```
+
+**Modify**: `src/agent-runner.ts` — replace `setTimeout` with output-activity-based timeout
+
+### 2.3 Worktree Pool (from emdash)
+
+**Current**: Create worktree on-demand (3-7s delay per task)
+**Better**: Pre-create reserve worktrees, claim instantly
+
+```typescript
+interface WorktreePool {
+  reserves: Map<string, ReserveWorktree>
+  claimReserve(): Promise<Worktree>     // instant
+  replenishInBackground(): void          // async refill
+}
+```
+
+**Modify**: `src/worktree-pool.ts` — add reserve pool with background replenishment
+
+### 2.4 CLAUDE* Env Filtering (from metabot)
+
+**Problem**: Nested Claude Code sessions fail with "nested session" detection
+**Fix**: Filter all `CLAUDE_*` environment variables when spawning agent subprocess
+
+```typescript
+// metabot pattern:
+const env = Object.fromEntries(
+  Object.entries(process.env).filter(([k]) => !k.startsWith('CLAUDE'))
+)
+```
+
+**Modify**: `src/agent-runner.ts` — add env filtering to spawn options
+
+### 2.5 GUPP Hook Pattern (from Gas Town)
+
+**Gas Town's GUPP**: "If there is work on your Hook, YOU MUST RUN IT."
+Each agent has a pinned task as its work queue. Session starts → auto-execute.
+
+```typescript
+// Inject current task into agent's system prompt (CLAUDE.md)
+// Agent sees task on startup → immediately starts working
+// No polling, no external trigger needed
+```
+
+**Modify**: `src/agent-runner.ts` — write task details to worktree's CLAUDE.md before spawn
+
+### 2.6 Handoff + Context Recovery (from Gas Town)
+
+When agent hits context limit or crashes:
+1. Write summary of decisions/progress to checkpoint file
+2. Start new session with checkpoint as context
+3. New session resumes from where old one left off
+
+```typescript
+interface HandoffProtocol {
+  saveCheckpoint(workerId: string, summary: string): void
+  loadCheckpoint(workerId: string): string | null
+  seance(workerId: string): PreviousDecisions  // query past session
+}
+```
+
+**New file**: `src/handoff.ts` (~100 LOC)
+
+### 2.7 Beads Dual Persistence (from Gas Town)
+
+SQLite for fast queries + JSONL for git tracking:
+- `.tasks/tasks.db` — SQLite, fast status queries
+- `.tasks/tasks.jsonl` — git-tracked, cross-machine sync
+
+**Modify**: `src/store.ts` — add JSONL append on every state change
+
+### 2.8 Three-Phase Lifecycle (from emdash)
+
+```
+setup → run → teardown
+```
+
+Each phase has its own status, logs, and timeout.
+- **setup**: npm install, env prep, custom scripts
+- **run**: agent execution
+- **teardown**: cleanup, PR creation, notification
+
+**Modify**: `src/agent-runner.ts` — refactor into 3 phases
+
+---
+
+## Phase 3: Borrow the Intelligence (90% → 95%)
+
+### 3.1 Provider Registry (from emdash + vibe-kanban)
+
+Declarative config for each agent type:
+
+```typescript
+interface AgentProvider {
+  id: string                    // "claude" | "codex" | "gemini"
+  command: string               // "claude" | "codex" | "gemini"
+  promptFlag: string            // "-p" | "--prompt" | "--message"
+  autoApproveFlag?: string      // "--dangerously-skip-permissions"
+  sessionIdFlag?: string        // "--session-id"
+  resumeFlag?: string           // "-c -r"
+  useKeystrokeInjection?: bool  // for agents without prompt flag
+}
+```
+
+**New file**: `src/providers/registry.ts` (~150 LOC)
+- Declarative: adding a new agent = adding a JSON entry
+- No code changes needed to support new agents
+
+### 3.2 Attempt Model (from vibe-kanban)
+
+Each task can have multiple attempts:
+- Different agents, different prompts, different results
+- Compare diffs across attempts
+- Pick the best one to merge
+
+**Modify**: `src/store.ts` — add `attempts` table, `task_id` → `attempt[]`
+
+### 3.3 Review Comment Routing (from Composio)
+
+```
+PR review comment → orchestrator detects → routes to original agent → agent addresses
+```
+
+**New file**: `src/review-router.ts` (~150 LOC)
+
+### 3.4 Linear Integration (from Symphony)
+
+Symphony's Linear GraphQL adapter is clean:
+- Poll Linear for active issues
+- Map Linear states to internal states
+- Agent can query Linear directly via injected tool
+
+**Modify**: `src/integrations/` — add `linear.ts`
+
+---
+
+## Phase 4: Borrow the Polish (user acquisition)
+
+### 4.1 Kanban Dashboard (inspired by vibe-kanban)
+
+Don't build React from scratch. Enhance existing HTML dashboard:
+- Kanban columns: Backlog → In Progress → Review → Done
+- Real-time SSE updates (already have this)
+- Click to view diff, logs, agent output
+
+### 4.2 PRD → Epic → Task (from ccpm)
+
+ccpm's YAML frontmatter + Markdown body pattern:
+```yaml
+---
+name: Auth System
+status: backlog
+depends_on: [001]
+parallel: true
+conflicts_with: [003]
+---
+```
+
+**Borrow**: The decomposition chain + frontmatter format
+**Don't borrow**: The 37 slash commands (too complex)
+
+### 4.3 WORKFLOW.md as First-Class (from Symphony)
+
+Symphony's WORKFLOW.md is a contract:
+- YAML frontmatter for runtime config
+- Liquid templates for agent prompts
+- Dynamic reload without restart
+
+**Modify**: `src/workflow-loader.ts` — support YAML frontmatter + Liquid templates
+
+### 4.4 IM Bridge (from metabot)
+
+Telegram bot for mobile monitoring:
+- `cc-m ls` from your phone
+- Notifications on task completion/failure
+- Quick approve/reject
+
+**New file**: `src/integrations/telegram.ts` (~200 LOC)
+
+---
+
+## What We Do NOT Borrow
+
+| Feature | Why Not |
+|---------|---------|
+| vibe-kanban's Rust backend | We're TypeScript. Our stack is fine. |
+| vibe-kanban's ElectricSQL | Overkill for single-user CLI tool |
+| ccpm's 37 slash commands | Too complex. We automate, not prompt. |
+| Symphony's Elixir | Language mismatch |
+| container-use's Dagger | Worktrees are sufficient for now |
+| cmux's Swift/macOS | We're cross-platform CLI |
+| emdash's Electron | We're terminal-first |
+| Gas Town's Go language | Language mismatch, but patterns are gold |
+| Gas Town's Dolt DB | SQLite + JSONL is simpler and sufficient |
+| Gas Town's MEOW stack | Over-abstracted for our needs (Beads are enough) |
+
+---
+
+## Priority Execution Order
+
+```
+Sprint 1 (P0 — make it work):
+  1. staged-merger.ts        ← OUR MOAT
+  2. wave-planner.ts         ← OUR MOAT
+  3. merge queue + CI bisect (Gas Town's Refinery pattern)
+  4. CI auto-fix loop        (Composio pattern)
+  5. failure-diagnoser.ts    ← OUR MOAT
+
+Sprint 2 (P1 — make it robust):
+  6. GUPP hook pattern       (from Gas Town — task in CLAUDE.md)
+  7. handoff.ts              (from Gas Town — context recovery)
+  8. jsonl-monitor.ts        (from Composio)
+  9. stall timeout           (from lalph)
+  10. worktree pool          (from emdash)
+  11. CLAUDE* env filtering  (from metabot)
+  12. three-phase lifecycle  (from emdash)
+
+Sprint 3 (P2 — make it smart):
+  13. provider registry      (from emdash/vibe-kanban)
+  14. attempt model          (from vibe-kanban)
+  15. dual persistence       (from Gas Town — SQLite + JSONL)
+  16. review-router.ts       (from Composio)
+  17. linear.ts              (from Symphony)
+
+Sprint 4 (P3 — make it beautiful):
+  18. kanban dashboard       (inspired by vibe-kanban)
+  19. WORKFLOW.md upgrade     (from Symphony)
+  20. telegram.ts            (from metabot)
+```
+
+---
+
+## File Changes Summary
+
+| Sprint | New Files | Modified Files | Est. LOC |
+|--------|-----------|----------------|----------|
+| 1 | staged-merger.ts, wave-planner.ts, failure-diagnoser.ts | scheduler.ts, agent-runner.ts, staged-merger.ts (merge queue) | ~900 |
+| 2 | handoff.ts, jsonl-monitor.ts | agent-runner.ts (GUPP + stall + env + lifecycle), worktree-pool.ts | ~600 |
+| 3 | providers/registry.ts, review-router.ts, integrations/linear.ts | store.ts (dual persistence + attempts) | ~600 |
+| 4 | integrations/telegram.ts | workflow-loader.ts, dashboard HTML | ~400 |
+| **Total** | **8 new** | **7 modified** | **~2500** |
+
+---
+
+## Success Metrics
+
+```
+After Sprint 1: 0% → 80% auto-merge (staged merging alone fixes most failures)
+After Sprint 2: 80% → 90% (robust runtime, fewer crashes/hangs)
+After Sprint 3: 90% → 95% (smart routing, multi-attempt, review loop)
+After Sprint 4: 95% + beautiful UI + mobile access
+```
+
+---
+
+## The One Sentence
+
+**cc-manager is the only orchestrator that understands task dependencies before dispatch, merges incrementally instead of all-at-once, and diagnoses failures to fix the environment rather than retry blindly.**
+
+Every borrowed feature serves this core thesis. Nothing we borrow dilutes our moat.
diff --git a/docs/PRODUCT-VISION.md b/docs/PRODUCT-VISION.md
new file mode 100644
index 0000000..1d65e5c
--- /dev/null
+++ b/docs/PRODUCT-VISION.md
@@ -0,0 +1,288 @@
+# cc-manager: Product Vision — "Best in Class"
+
+**Date**: 2026-03-05
+**Status**: Strategic rethink after competitive analysis
+
+---
+
+## The Honest Assessment
+
+We ran 20 tasks today. 0% auto-merge success. The code was all good (367 tests pass after manual merge), but the orchestrator failed to deliver end-to-end results.
+
+Meanwhile:
+- Composio: 84.6% CI success, 30 parallel agents, 40K LOC in 8 days
+- vibe-kanban: 22K stars, beautiful kanban UI
+- claude-squad: 6K stars, dead simple TUI
+
+**We are not competing on features. We are behind.**
+
+---
+
+## What "Best" Actually Means
+
+The user doesn't care about:
+- How many plugins we support
+- What our type system looks like
+- Whether we have a state machine
+
+The user cares about ONE thing:
+
+> "I have 50 GitHub Issues. I want them all done by tomorrow morning. With working code, passing tests, and merged PRs."
+
+**Success rate is the only metric that matters.**
+
+Everything else — plugins, memory, self-evolution — is meaningless if the basic loop doesn't work.
+
+---
+
+## Why Orchestrators Fail Today
+
+Every orchestrator (including ours) has the same fundamental problem:
+
+```
+Issue → Dispatch agent → Agent writes code → Gate check → FAIL
+                                                  ↓
+                                            Mark as failed
+                                            (user does manual work)
+```
+
+The failure modes:
+
+### 1. Isolation Paradox
+Agents work in isolated worktrees. Agent A creates a new type. Agent B needs that type but can't see it. TSC fails for both.
+
+**Nobody solves this.** Composio, vibe-kanban, claude-squad — they all have this problem. They just retry and hope.
+
+### 2. Dumb Dispatch
+Current orchestrators are glorified `for task in tasks: spawn(agent, task)`. No understanding of:
+- Task dependency (type definitions before consumers)
+- Conflict prediction (two agents editing same file)
+- Optimal ordering (foundation first, features second)
+
+### 3. No Recovery Intelligence
+When a task fails, orchestrators either:
+- Retry with the same prompt (insanity)
+- Give up (waste)
+- Let the user fix it (defeat)
+
+Nobody does: "TSC failed because type X is missing → find which other task creates type X → merge that first → retry"
+
+---
+
+## The Vision: Intelligent Orchestration
+
+cc-manager should be the orchestrator that **understands what it's doing**.
+
+Not a task queue. Not a worktree manager. An **intelligent build planner for agent work**.
+
+### Core Insight
+
+The best orchestrator is not the one that dispatches fastest.
+It's the one that **fails least**.
+
+```
+                    Current Orchestrators          cc-manager v0.2
+                    ─────────────────────          ──────────────────
+Dispatch            Parallel, hope for best        Dependency-aware DAG
+Isolation           Full isolation (causes TSC)    Staged merging between waves
+Failure handling    Retry or give up               Diagnose → fix dependency → retry
+Task ordering       FIFO / priority                Topological sort by code deps
+Conflict            Detect after fail              Predict before dispatch
+Success rate        ~80%                           Target: 95%+
+```
+
+### The Three Pillars
+
+#### Pillar 1: Dependency-Aware Dispatch
+
+Before dispatching, analyze the task set:
+
+```
+Tasks:
+  T1: Create types.ts (new types)
+  T2: Create router.ts (imports types.ts)
+  T3: Modify scheduler.ts (imports nothing new)
+  T4: Create memory.ts (imports store.ts patterns)
+
+Dependency graph:
+  T1 → T2 (T2 depends on T1's types)
+  T3 → (independent)
+  T4 → (independent)
+
+Execution plan:
+  Wave 1: T1, T3, T4 (parallel, no deps)
+  Wave 2: T2 (after T1 merges)
+```
+
+Between waves: merge completed work to main, rebase remaining worktrees.
+
+This is what we should have done today. Instead we dispatched all 10 in parallel and got 0% auto-merge.
+
+#### Pillar 2: Staged Merging
+
+Don't wait for all tasks to finish. Merge as you go:
+
+```
+Time 0:  Dispatch Wave 1 (T1, T3, T4)
+Time 2m: T3 completes, TSC passes → merge to main
+Time 3m: T1 completes, TSC passes → merge to main
+Time 3m: Rebase T4's worktree onto new main
+Time 4m: T4 completes, TSC passes → merge to main
+Time 4m: Dispatch Wave 2 (T2) on updated main
+Time 6m: T2 completes, TSC passes → merge to main
+         ALL DONE. 100% success.
+```
+
+vs current approach:
+```
+Time 0:  Dispatch all (T1, T2, T3, T4) in parallel
+Time 5m: T2 fails (can't find types from T1)
+         T1, T3, T4 fail (TSC sees missing cross-refs)
+         0% auto-merge. User manually cherry-picks.
+```
+
+#### Pillar 3: Failure Diagnosis Engine
+
+When a task fails, don't just retry. Diagnose:
+
+```
+Task T2 failed.
+TSC error: "Cannot find module './types.js'"
+
+Diagnosis:
+  1. T2 imports from types.ts
+  2. types.ts was created by T1 in worker/worker-0
+  3. T1 hasn't merged to main yet
+  4. Resolution: merge T1 first, rebase T2's worktree, retry T2
+
+Action: merge T1 → rebase T2 → retry T2
+```
+
+This turns "retry with same prompt" into "fix the environment, then retry".
+
+For code-level failures:
+```
+Task T5 failed.
+Agent output: "Error: property 'tags' does not exist on type TaskCreateInput"
+
+Diagnosis:
+  1. Agent hallucinated a 'tags' field on TaskCreateInput
+  2. TaskCreateInput is defined in types.ts
+  3. Fix: remove 'tags' from the generated code
+
+Action: spawn fix agent with targeted prompt:
+  "In file X, remove the 'tags' property — it doesn't exist on TaskCreateInput"
+```
+
+---
+
+## Product Architecture
+
+```
+┌─────────────────────────────────────────────────────────────┐
+│                     cc-manager v0.2                          │
+│                                                             │
+│  ┌─────────────────┐                                        │
+│  │  Issue Source    │  GitHub Issues / Linear / CLI / API    │
+│  └────────┬────────┘                                        │
+│           ▼                                                 │
+│  ┌─────────────────┐                                        │
+│  │  Task Analyzer   │  ← NEW: analyze code deps, predict    │
+│  │                  │    conflicts, build execution DAG      │
+│  └────────┬────────┘                                        │
+│           ▼                                                 │
+│  ┌─────────────────┐                                        │
+│  │  Wave Planner    │  ← NEW: topological sort into waves,  │
+│  │                  │    maximize parallelism within waves   │
+│  └────────┬────────┘                                        │
+│           ▼                                                 │
+│  ┌─────────────────────────────────────────┐                │
+│  │  Execution Engine                        │                │
+│  │                                          │                │
+│  │  Wave 1: ┌──┐ ┌──┐ ┌──┐                │                │
+│  │          │W0│ │W1│ │W2│  (parallel)     │                │
+│  │          └──┘ └──┘ └──┘                 │                │
+│  │            ↓                             │                │
+│  │  Staged Merge: merge completed → rebase  │  ← NEW        │
+│  │            ↓                             │                │
+│  │  Wave 2: ┌──┐ ┌──┐                     │                │
+│  │          │W3│ │W4│  (parallel)          │                │
+│  │          └──┘ └──┘                      │                │
+│  │            ↓                             │                │
+│  │  Staged Merge → rebase → ...            │                │
+│  └─────────────────────────────────────────┘                │
+│           ▼                                                 │
+│  ┌─────────────────┐                                        │
+│  │ Failure Diagnoser│  ← NEW: parse TSC/test errors,        │
+│  │                  │    identify root cause, auto-fix       │
+│  └────────┬────────┘                                        │
+│           ▼                                                 │
+│  ┌─────────────────┐                                        │
+│  │  PR / Merge      │  cross-review → merge → close issue   │
+│  └─────────────────┘                                        │
+└─────────────────────────────────────────────────────────────┘
+```
+
+---
+
+## What We Build (Priority Order)
+
+### P0: Make the basic loop work (success rate from 0% to 80%+)
+
+1. **Staged merging** — merge completed tasks immediately, don't wait for all
+2. **Worktree rebase** — after each merge, rebase active worktrees onto new main
+3. **TSC error diagnosis** — parse TSC errors, identify missing deps, auto-resolve
+
+This alone would have turned today's 0/20 into ~16/20.
+
+### P1: Make it smart (success rate from 80% to 95%+)
+
+4. **Task dependency analysis** — before dispatch, analyze which tasks create/consume types/files
+5. **Wave planning** — group independent tasks into waves, sequence dependent tasks
+6. **Conflict prediction** — detect when two tasks will edit the same file, sequence them
+
+### P2: Make it beautiful (user acquisition)
+
+7. **Real-time dashboard** — show wave progress, dependency graph, live agent output
+8. **One-command experience** — `cc-m run "do all open issues"` (Opus decomposes, plans, executes)
+9. **Mobile notifications** — Telegram/Slack bot for completion alerts
+
+### P3: Make it unstoppable (moat)
+
+10. **Learning from failures** — every failure becomes a routing/prompting improvement
+11. **Agent benchmarking** — continuously test which agent is best for which task type
+12. **Self-evolution** — auto-upgrade agents, auto-discover new ones
+
+---
+
+## Success Metric
+
+One number: **End-to-end success rate**.
+
+```
+Success = (tasks that auto-merge with passing tests) / (total tasks submitted)
+
+Today:     0/20 = 0%     ← embarrassing
+Target P0: 16/20 = 80%   ← competitive with Composio
+Target P1: 19/20 = 95%   ← best in class
+Target P2: with auto-retry and diagnosis, effective 99%
+```
+
+Everything we build must move this number up.
+
+---
+
+## Why This Wins
+
+Every other orchestrator is a **dumb dispatcher** with a nice UI.
+
+cc-manager will be the **smart dispatcher** that:
+1. Understands task dependencies before dispatch
+2. Merges incrementally instead of all-or-nothing
+3. Diagnoses failures and fixes them automatically
+
+The analogy: other orchestrators are `make -j10` (parallel but dumb).
+cc-manager should be `bazel` (understands the dependency graph, caches intermediates, retries intelligently).
+
+No amount of UI polish or plugin architecture will beat 95% success rate.
+The user will tolerate an ugly dashboard if their issues get solved overnight.
diff --git a/docs/ROADMAP.md b/docs/ROADMAP.md
new file mode 100644
index 0000000..32aa061
--- /dev/null
+++ b/docs/ROADMAP.md
@@ -0,0 +1,184 @@
+# cc-manager Roadmap
+
+> **Updated**: 2026-03-05 | **Status**: Active
+
+## Current State (v0.1.7)
+
+| Metric | Value |
+|--------|-------|
+| Core modules | 13 (types, logger, store, worktree-pool, agent-runner, scheduler, server, cli, index, pipeline, pipeline-types, pipeline-store, task-classifier) |
+| LOC | 4,924 |
+| Tests | 372 pass, 0 fail |
+| Features shipped | Priority queue, worktree isolation, SQLite/WAL, SSE, cross-agent review, squash merge, cost tracking, 5-stage pipeline, DAG dispatch, staged rebase, task classifier, model escalation, GPT-5.4 routing, session resume, empty commit detection |
+| Agent types | 4 (claude, claude-sdk, codex, generic) |
+| API endpoints | 20+ |
+| Self-hosting commit rate | 43% (NOT WORKING — requires manual fixes) |
+
+### What works well
+- Worktree pool (create/acquire/release/merge with conflict detection)
+- Event-driven scheduler with priority queue, retry, and model escalation
+- Cross-agent diff review before merge (Claude codes → Codex reviews)
+- Squash merge with review persisted to SQLite + staged rebase
+- Real-time SSE dashboard + CLI client
+- 5-stage autonomous pipeline (research→decompose→execute→verify)
+- Dependency DAG dispatch with wave planning
+- Task classifier routing (quick/standard/deep → model/agent/contextProfile)
+- Empty commit detection (v0.1.7) — no more silent success
+
+### What's NOT working (honest assessment)
+1. **Flywheel loop** — 2 pipeline runs, 43-50% commit rate, 0% unattended merge
+2. **Complex file integration** — scheduler.ts (618 LOC) tasks always fail (0/4 across 2 runs)
+3. **Failure diagnosis** — only basic error injection, no structured parsing
+4. **Agent self-evolution** — Pillar 4 not started
+
+The flywheel is the #1 blocker. Until agents can reliably produce mergeable code, the self-hosting loop is aspirational.
+
+---
+
+## Competitive Landscape (2026-03)
+
+Key insight: Claude Code now has built-in Agent Teams, Hooks, and Worktrees. cc-manager should **not** reinvent coordination — it should be the **orchestration layer above** individual agent runtimes.
+
+| Tool | Strength | cc-manager differentiator |
+|------|----------|--------------------------|
+| Claude Code Agent Teams | Built-in multi-agent + shared tasks | cc-manager adds wave planning, CI feedback, multi-provider |
+| Gas Town (steveyegge) | Persistent work state (Beads), 20-30 agents | cc-manager adds dependency analysis, failure diagnosis |
+| Composio Orchestrator | CI auto-fix loop, 30 agents, MCP gateway | cc-manager adds wave planning, multi-provider flexibility |
+| Emdash | 22+ agents, issue integration, Docker isolation | cc-manager adds staged merging, failure diagnosis |
+| Vibe Kanban | Visual kanban, 10+ agents, built-in dev env | cc-manager adds programmatic API, wave planning |
+
+**cc-manager's moat**: Nobody else does dependency-aware wave planning + staged merging + automated failure diagnosis. These three together solve the isolation paradox.
+
+---
+
+## Roadmap: 3 Phases
+
+### Phase 1: Core Loop (the moat)
+
+> Goal: Solve the isolation paradox. Get auto-merge rate from ~50% to 80%+.
+
+| # | Feature | File | LOC | Priority |
+|---|---------|------|-----|----------|
+| 1 | **Wave planner** — analyze task deps, topological sort into waves | `src/wave-planner.ts` | ~160 | P0 |
+| 2 | **Staged merger** — merge completed → rebase active → next wave | `src/staged-merger.ts` | ~140 | P0 |
+| 3 | **Failure diagnoser** — parse TSC errors → isolation paradox detection → retry prompt | `src/failure-diagnoser.ts` | ~170 | P0 |
+| 4 | **Pipeline** — connects wave → dispatch → merge → diagnose | `src/pipeline.ts` | ~180 | P0 |
+| 5 | **CI feedback** — on TSC/test fail, inject errors into agent retry context | `src/agent-runner.ts` MODIFY | ~50 | P0 |
+| 6 | **Fix listTasks()** — merge memory + SQLite reads | `src/store.ts` MODIFY | ~20 | P1 |
+
+**How wave planning works**:
+```
+Tasks: [A: "create types.ts", B: "import from types.ts", C: "add tests"]
+           ↓ analyzeDeps()
+Edges: [A→B (B consumes types.ts created by A)]
+           ↓ planWaves()
+Wave 0: [A, C]  (independent, run parallel)
+Wave 1: [B]     (depends on A, runs after wave 0 merges)
+```
+
+**How staged merging works**:
+```
+Wave 0 starts: A and C run in parallel worktrees
+  A completes → mergeOne(A) → rebase C's worktree onto updated main
+  C completes → mergeOne(C)
+Wave 1 starts: B runs, can see A's types.ts (already merged)
+  B completes → mergeOne(B)
+```
+
+**Acceptance criteria**:
+- [ ] Wave planner correctly groups independent tasks
+- [ ] Staged merger merges immediately and rebases active worktrees
+- [ ] Failure diagnoser detects isolation paradox (missing module/type/export)
+- [ ] Pipeline orchestrates full wave→dispatch→merge→diagnose loop
+- [ ] Auto-merge rate improves measurably on a 5-task batch
+
+### Phase 2: Robustness
+
+> Goal: Handle failures gracefully, monitor intelligently, recover automatically.
+
+| # | Feature | File | LOC | Priority |
+|---|---------|------|-----|----------|
+| 7 | **Stall detection** — monitor output activity, not wall-clock | `src/agent-runner.ts` MODIFY | ~30 | P1 |
+| 8 | **JSONL monitor** — read Claude session files for progress | `src/jsonl-monitor.ts` | ~100 | P1 |
+| 9 | **Context recovery** — checkpoint task state, resume on failure | `src/checkpoint.ts` | ~100 | P1 |
+| 10 | **Worktree pre-warm** — reserve pool, zero-latency claim | `src/worktree-pool.ts` MODIFY | ~50 | P2 |
+| 11 | **Promise-based lock** — replace 10ms spin with async queue | `src/worktree-pool.ts` MODIFY | ~30 | P2 |
+| 12 | **Hooks integration** — leverage CC hooks for quality gates | `src/hooks.ts` | ~80 | P1 |
+
+**Hooks integration** (leveraging Claude Code's native hook system):
+```json
+{
+  "hooks": {
+    "TaskCompleted": [{
+      "type": "command",
+      "command": "npx tsc --noEmit && npm test"
+    }],
+    "Stop": [{
+      "type": "prompt",
+      "prompt": "Verify all acceptance criteria are met"
+    }]
+  }
+}
+```
+
+**Acceptance criteria**:
+- [ ] Stalled agents detected within 30s of last output
+- [ ] Session JSONL progress visible in dashboard
+- [ ] Failed tasks resume from checkpoint with previous context
+- [ ] Worktree acquire latency < 100ms (pre-warmed pool)
+
+### Phase 3: Scale + Intelligence
+
+> Goal: Multi-provider flexibility, smart routing, learning from history.
+
+| # | Feature | File | LOC | Priority |
+|---|---------|------|-----|----------|
+| 13 | **Provider registry** — declarative agent plugin system | `src/provider-registry.ts` | ~150 | P2 |
+| 14 | **Smart router** — route by complexity, history, budget | `src/router.ts` | ~150 | P2 |
+| 15 | **Execution memory** — store patterns, feed back to routing | `src/memory.ts` | ~100 | P2 |
+| 16 | **GitHub Issues integration** — issues → tasks (auto-dispatch) | `src/integrations/github.ts` | ~150 | P2 |
+| 17 | **Attempt model** — multiple tries per task, compare diffs | `src/scheduler.ts` MODIFY | ~80 | P3 |
+| 18 | **Dashboard v2** — kanban lanes, cost charts, wave visualization | `src/web/` MODIFY | ~200 | P3 |
+
+**Provider registry**:
+```typescript
+interface AgentProvider {
+  name: string;
+  detect(): Promise<boolean>;       // is this agent installed?
+  run(task, cwd): Promise<Result>;  // execute task
+  review(diff): Promise<Review>;    // review code
+  cost(tokens): number;             // estimate cost
+  capabilities: { maxContext, speed, supportsStreaming };
+}
+```
+
+**Acceptance criteria**:
+- [ ] New agent CLI auto-detected and registered
+- [ ] Tasks route to best agent based on complexity + history
+- [ ] GitHub Issues with label auto-convert to tasks
+- [ ] Memory stores success/failure patterns per task type
+
+---
+
+## Summary
+
+| Phase | New files | Modified | Est. LOC | Key metric |
+|-------|-----------|----------|----------|------------|
+| 1: Core Loop | 4 | 2 | ~720 | Auto-merge rate 50%→80% |
+| 2: Robustness | 3 | 3 | ~390 | Recovery rate, stall detection |
+| 3: Scale | 4 | 2 | ~830 | Multi-provider, smart routing |
+| **Total** | **11** | **7** | **~1,940** | 3,738→~5,700 LOC |
+
+**Critical path**: Phase 1 (#1-5) → Phase 2 (#7,8,12) → Phase 3 (#13,14)
+
+Phase 1 is the moat. Ship it first, measure auto-merge rate, then iterate.
+
+---
+
+## Design Principles
+
+1. **Leverage, don't reinvent** — Claude Code has Agent Teams, Hooks, Worktrees. Use them. cc-manager adds the orchestration layer above.
+2. **Merge early, merge often** — Staged merging is the core innovation. Every completed task merges immediately, every active worktree rebases.
+3. **Diagnose, don't retry blindly** — Parse errors structurally. Tell the agent exactly what's wrong and how to fix it.
+4. **One file per task** — Prevents merge conflicts. Creation (~100% success) > modification (~70% success).
+5. **Simple prompts** — 3-4 sentences max. One clear objective per task.
diff --git a/docs/SOURCE-CODE-ANALYSIS.md b/docs/SOURCE-CODE-ANALYSIS.md
new file mode 100644
index 0000000..c0e047b
--- /dev/null
+++ b/docs/SOURCE-CODE-ANALYSIS.md
@@ -0,0 +1,217 @@
+# Competitor Source Code Analysis
+
+> Deep-dive of 11 coding agent orchestrator projects.
+> Research date: 2026-03-05
+
+---
+
+## Tier 1: Full Orchestrators
+
+### 1. ComposioHQ/agent-orchestrator (3.7K stars)
+
+**Architecture**: TypeScript, 8-slot plugin system, YAML config, stateless flat-file
+
+**Key patterns**:
+- **JSONL Event Monitoring**: Reads `~/.claude/projects/*/sessions/*.jsonl` directly instead of parsing stdout. Every message, tool call, and turn completion is a structured event.
+- **8-Slot Plugin Architecture**: Runtime (tmux/docker/k8s), Agent (claude/codex/aider), Workspace (worktree/clone), Tracker (github/linear), SCM, Notifier, Terminal, Lifecycle
+- **CI Auto-Fix Reaction Engine**: CI fails → parse error logs → inject back into agent session → agent fixes → retry. This is their killer feature.
+- **Review Comment Routing**: PR comment → route to the agent that wrote the code → agent addresses it
+- **Self-built**: 30 agents, 8 days, 40K LOC, 84.6% CI success
+
+**Borrow**: JSONL monitoring, CI feedback loop, review routing
+
+### 2. BloopAI/vibe-kanban (22K stars)
+
+**Architecture**: Rust 49.6% (Axum + Tokio + SQLx) + TypeScript 48% (React + TanStack + Zustand)
+
+**Key patterns**:
+- **Attempt 1:N model**: Each task can have multiple attempts with different agents/prompts. Compare diffs across attempts. This treats LLM non-determinism as a product feature.
+- **`ts-rs` cross-language types**: Rust structs auto-generate TypeScript interfaces. Backend change → frontend build fails. Eliminates API drift.
+- **Per-path async mutex**: Worktree creation uses `LazyLock<Mutex<HashMap<String, Arc<tokio::sync::Mutex<()>>>>>` for concurrent safety
+- **Four-step worktree cleanup**: `git worktree remove --force` → delete `.git/worktrees/` metadata → `fs::remove_dir_all` → `git worktree prune`
+- **Orphan cleanup on startup**: Scan worktree base dir, delete directories with no DB record
+- **Electric SQL**: Local-first SQLite sync for offline-capable kanban board
+- **`enum_dispatch` agent trait**: Adding new agent = add enum variant + implement trait methods
+- **MCP dual integration**: Acts as both MCP client (connecting to tools) AND MCP server (exposing board to agents)
+
+**Borrow**: Attempt model, worktree cleanup sequence, startup orphan cleanup
+
+### 3. automazeio/ccpm (7.6K stars)
+
+**Architecture**: Pure Markdown protocol — all logic in `.claude/commands/pm/*.md` slash commands
+
+**Key patterns**:
+- **PRD → Epic → Task → Issue pipeline**: 5-phase discipline with full traceability
+- **File rename as mapping**: `001.md` → `{issue-id}.md` after GitHub sync. No database needed.
+- **Command YAML frontmatter**: Each command declares its required tools (`Read, Write, Bash, Task`)
+- **`epics/` in .gitignore**: Local PM workspace stays local, GitHub Issues are team truth
+- **Context isolation**: Sub-agents read `.claude/context/`, return only summaries
+- **`/pm:next`**: Auto-picks next priority task with full epic context
+- **`parallel: true` + `depends_on` + `conflicts_with`**: Task metadata for scheduling
+
+**Borrow**: Task dependency metadata format, `/pm:next` auto-pick, context isolation
+
+### 4. openai/symphony (4.2K stars)
+
+**Architecture**: Elixir OTP GenServer, WORKFLOW.md as single config
+
+**Key patterns**:
+- **WORKFLOW.md = YAML frontmatter + Liquid template prompt**: Single file configures tracker, workspace, agent, polling, hooks, and agent prompt
+- **Workspace hooks**: `after_create / before_run / after_run / before_remove` lifecycle
+- **Skills as `.codex/*.md`**: `land.md` teaches agent to squash-merge safely. Skills are copyable Markdown.
+- **Tracker writes through agent**: Symphony only reads Linear; agent writes via injected `linear_graphql` tool
+- **Thread sandbox**: `workspace-write` limits agent to its own directory
+- **Deterministic workspace key**: `sanitize(issue.identifier)` → directory name. No DB needed to rebuild state.
+- **Continuation turns**: After max_turns, agent pauses. Next poll cycle resumes with continuation guidance prompt.
+- **Proof-of-work package**: CI status + review addressed + complexity + walkthrough
+
+**Borrow**: WORKFLOW.md format, workspace hooks, continuation turns, proof-of-work
+
+### 5. smtg-ai/claude-squad (6.2K stars)
+
+**Architecture**: Go 87.9%, tmux session manager, Bubbletea TUI
+
+**Key patterns**:
+- **tmux as process container**: `tmux new-session -d -s "agent-0" -x 200 -y 50`. Survives crashes, user can `tmux attach` to watch.
+- **PTY input injection**: `tmux send-keys -t session "prompt text" Enter` for agents without --prompt flag
+- **SHA256 completion detection**: Hash pane content every tick. If hash unchanged for N ticks → agent is idle/done.
+- **Git worktree lifecycle**: `Setup() → Cleanup() → Remove() → Pause() → Resume()`
+- **`state.json` persistence**: Minimal state file for crash recovery
+
+**Borrow**: tmux runtime, SHA256 completion detection, worktree lifecycle
+
+---
+
+## Tier 2: Specialized Tools
+
+### 6. tim-smart/lalph (92 stars) — closest to cc-manager
+
+**Key patterns**:
+- **Label-based agent routing**: Issue labels map to agent presets (e.g., "fast-lane" → Sonnet, "deep-think" → Opus)
+- **Stall timeout**: Tracks last output time, not wall-clock. Agent alive if producing output.
+- **Issue dependency graph**: Wait for dependency PR to merge before starting next issue
+- **Plan mode → `.specs/`**: High-level spec → auto-generate PRD → auto-create sub-issues
+- **Finalizer auto-rollback**: `Effect.addFinalizer` resets issue to "todo" on failure
+- **Chooser → task.json protocol**: LLM writes choice to file, orchestrator reads it
+
+**Borrow**: Stall timeout, label routing, issue dependency graph
+
+### 7. generalaction/emdash (2.4K stars, YC W26)
+
+**Key patterns**:
+- **Worktree pool pre-warming**: Background pre-create reserve worktrees. `claimReserve()` returns instantly.
+- **22-provider registry**: Declarative config for each agent's CLI flags, prompt method, resume method
+- **Keystroke injection**: For agents without `--prompt` flag, inject via PTY keystrokes
+- **PTY env var whitelist**: Only pass listed env vars to agent (prevent secret leakage)
+- **Three-phase lifecycle**: `setup → run → teardown`, each with own status/logs/timeout
+- **HTTP hook server + UUID token**: Agent → HTTP POST → orchestrator, decoupled event notification
+- **`killProcessTree`**: `process.kill(-pid, signal)` for process group cleanup
+
+**Borrow**: Worktree pool, provider registry, three-phase lifecycle, process group kill
+
+### 8. dagger/container-use (3.6K stars)
+
+**Key patterns**:
+- **Git notes for state storage**: Container ID and config stored in `refs/notes/container-use`. No external DB. `git fetch` syncs state.
+- **`environment_checkpoint`**: Snapshot container state at key points, rollback on failure
+- **12 MCP tools**: `environment_create/open/run_cmd/file_read/write/edit/add_service/checkpoint`
+- **Single/multi-tenant MCP modes**: Per-chat or shared server
+
+**Borrow**: Git notes for state, checkpoint/rollback concept
+
+### 9. xvirobotics/metabot (96 stars)
+
+**Key patterns**:
+- **Agent Bus REST API**: `POST /api/tasks` (delegate), `POST /api/bots` (create agent), `POST /api/schedule` (cron)
+- **CLAUDE* env var filtering**: Filter `CLAUDE_*` vars to avoid nested session detection
+- **MetaMemory**: SQLite + Markdown dual knowledge base, shared across all agents
+- **chatId → sessionId persistence**: Resume agent sessions across IM conversations
+- **Cron scheduler**: Persistent to JSON, survives restart
+
+**Borrow**: CLAUDE* env filtering, Agent Bus API pattern, cron scheduler
+
+### 10. manaflow-ai/cmux (4.2K stars)
+
+**Key patterns**:
+- **OSC 777 notification protocol**: Terminal escape sequences for agent notifications
+- **Claude Code hook integration**: `Stop` and `PostToolUse` hooks → notification → workspace auto-reorder
+- **UNIX domain socket control**: `cmux workspace create/focus/notify` via socket API
+- **Sidebar status aggregation**: branch + PR + ports + last notification in one line
+
+**Borrow**: Hook-based notifications, status aggregation model
+
+### 11. humanlayer/humanlayer (9.6K stars)
+
+**Key patterns**:
+- **ACP (Agent Control Plane)**: Distributed scheduler for remote cloud workers
+- **"Advanced Context Engineering"**: Specialized for large codebases
+- **MULTICLAUDE**: Parallel Claude Code execution
+
+### 12. steveyegge/gastown (Steve Yegge)
+
+**Architecture**: Go 1.23+, Dolt (versioned SQLite) + JSONL, tmux sessions, git worktrees
+
+**The closest project to our vision.** Gas Town has:
+
+**Role hierarchy**:
+- **Mayor** = coordinator (user's single entry point, dispatches work)
+- **Polecats** = ephemeral worker agents (20-30 parallel, each in own worktree)
+- **Refinery** = merge queue manager (serial merge, conflict resolution)
+- **Witness** = supervisor (detects stuck agents, triggers recovery)
+- **Deacon** = daemon (patrol every 5 min, health monitoring)
+
+**Key patterns**:
+- **Convoy ≈ Wave**: Batch related tasks, `convoy stage` → `convoy launch`. BUT: manually created, no auto dependency analysis.
+- **Refinery ≈ Staged Merger**: Bors-style batch merge → run CI on tip → binary search for failure source on CI fail. Serial integration of parallel MR streams.
+- **GUPP (Universal Propulsion Principle)**: "If there is work on your Hook, YOU MUST RUN IT." — each agent has a pinned task as work queue, auto-executes on session start.
+- **Beads dual persistence**: SQLite (fast query) + JSONL (git-tracked). JSONL commits with code for cross-machine sync.
+- **Handoff + Seance**: `gt handoff` gracefully restarts agent at context limit. `gt seance` lets new session query previous session's decisions.
+- **NDI (Non-Deterministic Idempotency)**: All workflows assume agent can crash anytime. Tasks resume from any intermediate state.
+- **Six-stage lifecycle**: CREATE → LIVE → CLOSE → DECAY → COMPACT → FLATTEN. Wisp Reaper auto-closes stale tasks after 7 days.
+- **MEOW stack**: Formulas (TOML templates) → Protomolecules → Molecules (multi-step workflows) → Beads (atomic tasks) → Wisps (ephemeral)
+
+**What Gas Town has that we don't**:
+- Refinery merge queue with CI bisect
+- Handoff/Seance context recovery
+- Role-based architecture (Mayor/Polecat/Refinery/Witness)
+- GUPP hook-based auto-push
+
+**What we have that Gas Town doesn't**:
+- **Automatic dependency analysis** (Gas Town's Convoy is manual)
+- **Cross-task type tracking** (which task creates types another needs)
+- **Proactive failure diagnosis** (parse error → identify root cause → fix env)
+
+**Borrow**: Refinery merge queue + bisect, GUPP hook pattern, Handoff context recovery, Beads dual persistence, role separation
+
+---
+
+## Cross-Cutting Patterns (appears in 3+ projects)
+
+| Pattern | Projects | Description |
+|---------|----------|-------------|
+| Git worktree isolation | ALL 11 | Every project uses worktrees for agent isolation |
+| YAML/MD config files | ccpm, symphony, lalph | Single-file declarative configuration |
+| Agent as subprocess | ALL except container-use | spawn CLI process, monitor stdout/stderr |
+| SSE for real-time updates | vibe-kanban, composio, cc-manager | Server-sent events for dashboard |
+| SQLite for state | vibe-kanban, emdash, metabot | Local-first persistence |
+| `gh` CLI for GitHub | ALL with GitHub integration | Standard PR/issue management |
+| Exponential backoff retry | symphony, composio, cc-manager | Failure recovery |
+| Process group kill | emdash, claude-squad | `-pid` signal for clean teardown |
+
+---
+
+## What Nobody Does (our moat opportunity)
+
+| Feature | Status across all 11 projects |
+|---------|-------------------------------|
+| **Dependency-aware wave planning** | Gas Town has manual Convoy. Nobody does auto-analysis. |
+| **Staged merging between waves** | Gas Town's Refinery is closest (Bors-style). But no wave↔merge integration. |
+| **Proactive failure diagnosis** | ZERO projects. All do reactive retry. |
+| **Cross-task type dependency tracking** | ZERO projects. All treat tasks as independent. |
+
+Gas Town's Refinery is the closest to our staged merging vision, but it lacks:
+1. Auto dependency analysis (Convoys are manual)
+2. Wave↔merge integration (Refinery runs independently of dispatch)
+3. Proactive diagnosis (still reactive retry)
+
+**Our moat = the integration**: analyze deps → auto-plan waves → staged merge → diagnose failures. Nobody connects all four.
diff --git a/docs/STRATEGY.md b/docs/STRATEGY.md
new file mode 100644
index 0000000..5257640
--- /dev/null
+++ b/docs/STRATEGY.md
@@ -0,0 +1,64 @@
+# cc-manager Strategy Notes
+
+## Competitive Landscape (2026-03)
+- 18+ competing projects in "coding agent orchestrator" space
+- Top: vibe-kanban (22K stars), humanlayer (9.7K), ccpm (7.6K), claude-squad (6.2K)
+- Closest competitor: ComposioHQ/agent-orchestrator (3.7K stars, 8-slot plugin, CI auto-fix)
+- ALL competitors are dumb dispatchers — none do dependency-aware wave planning
+
+## cc-manager Key Insight
+Every orchestrator does: dispatch → hope → retry
+cc-manager should do: analyze deps → plan waves → merge incrementally → diagnose failures
+
+## Learned from 2026-03-05 Sprint
+- 20 tasks, 10 workers, $12.29 total cost
+- 0% auto-merge (TSC gate), but all code was correct (367 tests pass after manual merge)
+- Root cause: parallel worktrees can't see each other's new types
+- Fix needed: staged merging between waves, not all-at-once dispatch
+
+## Four Pillars
+1. Dependency-aware dispatch (build DAG before dispatching)
+2. Staged merging (merge completed → rebase active → continue)
+3. Failure diagnosis (parse errors → identify root cause → auto-fix)
+4. **Agent self-evolution** (monitor 3 agent versions → detect new features → auto-upgrade integration)
+   - cc-manager consumes the agents it orchestrates to upgrade itself
+   - See [3-agents-reference.md](3-agents-reference.md) "Self-Evolution: Agent Version Monitor" section
+
+## Key Borrowed Patterns (priority order)
+1. Refinery merge queue + CI bisect (Gas Town) — batch merge, binary search failure
+2. CI auto-fix loop (Composio) — inject failure logs back into agent
+3. GUPP hook pattern (Gas Town) — task injected into CLAUDE.md, auto-execute
+4. Handoff + Seance (Gas Town) — context recovery across sessions
+5. JSONL event monitoring (Composio) — read ~/.claude/projects/*/sessions/*.jsonl
+6. Stall timeout (lalph) — output activity, not wall-clock
+7. Worktree pool pre-warming (emdash) — instant task start
+8. CLAUDE* env filtering (metabot) — prevent nested session errors
+9. Provider registry (emdash/vibe-kanban) — declarative agent config
+10. Attempt model (vibe-kanban) — multiple tries per task, compare diffs
+11. Dual persistence (Gas Town) — SQLite + JSONL git-tracked
+12. Three-phase lifecycle (emdash) — setup/run/teardown
+13. WORKFLOW.md (symphony) — YAML frontmatter + Liquid template prompt
+
+## Gas Town (steveyegge/gastown) — Closest Competitor
+- Go-based, Dolt + JSONL, tmux sessions
+- Convoy ≈ our Wave (but manual, not auto-analyzed)
+- Refinery ≈ our Staged Merger (Bors-style, with CI bisect)
+- GUPP = hook-based auto-push (agent auto-executes pinned task)
+- Handoff/Seance = context recovery across sessions
+- Our advantage: automatic dependency analysis + proactive failure diagnosis
+
+## Documentation Map
+- docs/plans/2026-03-05-v0.2-implementation-plan.md — v0.2 concrete plan (9 features, 3 phases)
+- docs/3-agents-reference.md — Claude CLI, Claude SDK, Codex CLI features + gaps + routing
+- docs/research/2026-03-05-agent-landscape.md — Perplexity Computer, GPT-5.4, latest SDK/CLI research
+- docs/SOURCE-CODE-ANALYSIS.md — 11 competitor deep-dives
+- docs/BUILD-VS-BORROW.md — what to build vs borrow
+- docs/PRODUCT-VISION.md — three pillars + priority order
+- docs/COMPETITIVE-ANALYSIS.md — market map + feature matrix
+- docs/ROADMAP.md — v0.1.x → v0.2.0 unified roadmap
+- docs/GAP-ANALYSIS.md — self-assessment + action plan
+
+## User Role Model
+- User is CEO, cc-m is CTO with R&D team
+- cc-manager should run autonomously: Issues in → PRs merged out
+- One metric: end-to-end success rate (current: 0%, target: 95%)
diff --git a/docs/plans/2026-03-05-v0.1.6-implementation-plan.md b/docs/plans/2026-03-05-v0.1.6-implementation-plan.md
new file mode 100644
index 0000000..47f5228
--- /dev/null
+++ b/docs/plans/2026-03-05-v0.1.6-implementation-plan.md
@@ -0,0 +1,961 @@
+# Implementation Plan
+
+> **For Claude:** REQUIRED SUB-SKILL: Use superpowers:executing-plans to implement this plan task-by-task.
+
+**Goal:** Implement v0.1.6 Phase 1 Critical Path: fix prompt accumulation on retry, add staged rebase after merge, and support array dependency DAGs.
+
+**Architecture:** Three independent features layered bottom-up through types → store → worktree-pool → agent-runner → scheduler. Types change first (Wave 0), then store + worktree-pool in parallel (Wave 1), then agent-runner (Wave 2), then scheduler integrates everything (Wave 3), then tests (Wave 4).
+
+**Tech Stack:** TypeScript 5, Node.js ESM, better-sqlite3, node:test + assert/strict
+
+---
+
+## Summary
+
+**Feature 1 — Prompt accumulation fix + model escalation:** Each retry currently appends error context to `task.prompt`, so by retry 3 the prompt contains 3 stacked error sections. Fix by saving the original prompt in `task._originalPrompt` on first retry, then rebuilding from `_originalPrompt + latest error` on each subsequent retry. Add model escalation: when `retryCount >= 2` set `task.modelOverride = "claude-opus-4-6"` so hard tasks get a more powerful model. `_originalPrompt` is persisted in SQLite (new `original_prompt` column migration). `modelOverride` is transient (set in memory at retry time, recomputed each retry).
+
+**Feature 2 — Staged rebase:** After a successful merge, other busy workers operate on a stale `main`. Add `WorktreePool.getActiveWorkers(exclude?)` (returns busy worker names, optionally excluding one) and `WorktreePool.rebaseOnMain(workerName)` (rebases branch onto current `main` tip, returns false on conflict). After every successful merge in `scheduler.executeAndRelease`, fire `rebaseOnMain` on all other active workers as best-effort (errors caught and logged, never blocking dispatch).
+
+**Feature 3 — Dependency DAG:** `dependsOn` currently accepts only a single string task ID. Extend to `string | string[]` (backward-compatible). The dispatch loop checks ALL dependencies; if any is failed/timeout/cancelled the task fails immediately; if any is still pending/running the task is re-queued. Store serializes array values as JSON (detected on read by `startsWith('[')`).
+
+---
+
+## Files to Create
+_(none — all changes are modifications to existing files)_
+
+## Files to Modify
+- `src/types.ts` — add `_originalPrompt?`, `modelOverride?` to Task; change `dependsOn` to `string | string[]`; update `createTask` opts
+- `src/store.ts` — add `original_prompt` column migration; update taskToParams/rowToTask for `_originalPrompt`; serialize array `dependsOn` as JSON; update `fieldMap` in `update()`
+- `src/worktree-pool.ts` — add `getActiveWorkers(exclude?)` and `rebaseOnMain(workerName)` public methods
+- `src/agent-runner.ts` — use `task.modelOverride ?? task.model ?? this.model` in `runClaudeSDK` and `runClaude`
+- `src/scheduler.ts` — fix prompt accumulation in `executeAndRelease` + `requeue`; add model escalation; update dependency check loop for arrays; call `pool.rebaseOnMain` on other workers after successful merge; update `submit()` opts type
+- `src/__tests__/scheduler.test.ts` — update `makePool()` mock; add tests for prompt accumulation fix, model escalation, array dependsOn
+- `src/__tests__/worktree-pool.test.ts` — add tests for `getActiveWorkers` and `rebaseOnMain`
+
+---
+
+## Waves (execution order)
+
+### Wave 0: Types (single task, blocks everything else)
+
+#### Task 1: Update `src/types.ts`
+
+**Files:**
+- Modify: `src/types.ts`
+
+**Step 1: Add two new optional fields to the Task interface**
+
+After line 39 (`model?: string;`), insert:
+```typescript
+  modelOverride?: string;
+  _originalPrompt?: string;
+```
+
+**Step 2: Change `dependsOn` type**
+
+Line 34: change `dependsOn?: string;` to:
+```typescript
+  dependsOn?: string | string[];
+```
+
+No changes needed to `createTask` body — `opts?.dependsOn` assignment already works for `string | string[]`.
+
+**Step 3: Run tsc to verify**
+```bash
+npx tsc --noEmit
+```
+Expected: no errors (this is a pure type widening, no breaking changes)
+
+**Step 4: Commit**
+```bash
+git add -A && git commit -m "feat(types): add modelOverride, _originalPrompt; widen dependsOn to string|string[]"
+```
+
+---
+
+### Wave 1: Store + WorktreePool (parallel — independent files, both depend on Wave 0)
+
+#### Task 2: Update `src/store.ts`
+
+**Files:**
+- Modify: `src/store.ts`
+
+This task has four parts. Apply them in sequence within this task.
+
+**Part A — Add migration for `original_prompt` column**
+
+In `migrate()`, after the existing `review` column migration block (around line 89, after `"ALTER TABLE tasks ADD COLUMN review TEXT"`), add:
+```typescript
+    // Add original_prompt column to preserve original prompt across retries
+    try {
+      this.db.exec("ALTER TABLE tasks ADD COLUMN original_prompt TEXT");
+    } catch {
+      // Column already exists — safe to ignore
+    }
+```
+
+**Part B — Update `taskToParams()`**
+
+The existing method returns 25 params. Replace it entirely:
+```typescript
+  private taskToParams(task: Task): unknown[] {
+    return [
+      task.id, task.prompt, task.status, task.worktree ?? null,
+      task.output, task.error, JSON.stringify(task.events),
+      task.createdAt, task.startedAt ?? null, task.completedAt ?? null,
+      task.timeout, task.maxBudget, task.costUsd,
+      task.tokenInput, task.tokenOutput, task.durationMs, task.retryCount, task.maxRetries,
+      task.priority ?? "normal",
+      JSON.stringify(task.tags ?? []),
+      task.dependsOn == null
+        ? null
+        : Array.isArray(task.dependsOn)
+          ? JSON.stringify(task.dependsOn)
+          : task.dependsOn,
+      task.webhookUrl ?? null, task.summary ?? null,
+      task.agent ?? "claude",
+      JSON.stringify(task.review ?? null),
+      task._originalPrompt ?? null,
+    ];
+  }
+```
+(26 params now — `original_prompt` is the last one)
+
+**Part C — Update all SQL statements to include `original_prompt`**
+
+There are 4 SQL statements across `save()`, `updateBatch()`, and `saveBatch()` — two variants each (INSERT and UPDATE). Update all of them:
+
+INSERT (add `original_prompt` to column list and add `?` to VALUES — goes from 25 `?` to 26):
+```sql
+INSERT OR IGNORE INTO tasks
+(id, prompt, status, worktree, output, error, events, created_at,
+ started_at, completed_at, timeout, max_budget, cost_usd,
+ token_input, token_output, duration_ms, retry_count, max_retries, priority, tags,
+ depends_on, webhook_url, summary, agent, review, original_prompt)
+VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+```
+
+UPDATE (add `original_prompt=?` before `WHERE id=?`):
+```sql
+UPDATE tasks SET
+  prompt=?, status=?, worktree=?, output=?, error=?, events=?, created_at=?,
+  started_at=?, completed_at=?, timeout=?, max_budget=?, cost_usd=?,
+  token_input=?, token_output=?, duration_ms=?, retry_count=?, max_retries=?,
+  priority=?, tags=?, depends_on=?, webhook_url=?, summary=?, agent=?, review=?,
+  original_prompt=?
+WHERE id=?
+```
+
+Apply these SQL changes to `save()`, `updateBatch()` (insertStmt + updateStmt), and `saveBatch()` (insertStmt + updateStmt) — 6 SQL strings total.
+
+**Part D — Update `update()` fieldMap and `rowToTask()`**
+
+In `update()` fieldMap, replace the existing `dependsOn` entry and add `_originalPrompt`:
+```typescript
+      dependsOn:   { col: "depends_on", serialize: (v) => {
+        if (v == null) return null;
+        return Array.isArray(v) ? JSON.stringify(v as unknown[]) : v as string;
+      }},
+      _originalPrompt: { col: "original_prompt" },
+```
+
+In `rowToTask()`, replace the `dependsOn` line and add `_originalPrompt`:
+```typescript
+      dependsOn: (() => {
+        const raw = row.depends_on as string | null | undefined;
+        if (!raw) return undefined;
+        if (raw.startsWith("[")) {
+          try { return JSON.parse(raw) as string[]; } catch { return raw; }
+        }
+        return raw;
+      })(),
+      _originalPrompt: (row.original_prompt as string | null) ?? undefined,
+```
+
+**Step 5: Run tsc**
+```bash
+npx tsc --noEmit
+```
+Expected: no errors. Fix any type errors before committing.
+
+**Step 6: Commit**
+```bash
+git add -A && git commit -m "feat(store): persist _originalPrompt; serialize dependsOn array as JSON"
+```
+
+---
+
+#### Task 3: Add rebase methods to `src/worktree-pool.ts`
+
+**Files:**
+- Modify: `src/worktree-pool.ts`
+
+**Step 1: Add two public methods**
+
+Insert after the `getWorkerStats()` method (around line 386) and before the private `git()` helper:
+
+```typescript
+  /**
+   * Returns names of all currently-busy workers, optionally excluding one.
+   * Used by the scheduler to find other workers to rebase after a merge.
+   */
+  getActiveWorkers(exclude?: string): string[] {
+    const result: string[] = [];
+    for (const w of this.workers.values()) {
+      if (w.busy && w.name !== exclude) result.push(w.name);
+    }
+    return result;
+  }
+
+  /**
+   * Rebases the worker's branch onto the current tip of main.
+   * Returns true on success, false if there were conflicts (rebase is aborted).
+   * Best-effort — callers must not block on failure.
+   */
+  async rebaseOnMain(workerName: string): Promise<boolean> {
+    const w = this.workers.get(workerName);
+    if (!w) return false;
+    try {
+      const { stdout } = await this.git("rev-parse", "main");
+      const mainSha = stdout.trim();
+      await this.gitIn(w.path, "rebase", mainSha);
+      return true;
+    } catch {
+      await this.gitIn(w.path, "rebase", "--abort").catch(() => {});
+      log("warn", "[pool] rebaseOnMain: conflict, aborted", { worker: workerName });
+      return false;
+    }
+  }
+```
+
+**Step 2: Run tsc**
+```bash
+npx tsc --noEmit
+```
+Expected: no errors
+
+**Step 3: Commit**
+```bash
+git add -A && git commit -m "feat(worktree-pool): add getActiveWorkers() and rebaseOnMain()"
+```
+
+---
+
+### Wave 2: AgentRunner model override (depends on Wave 0)
+
+#### Task 4: Update `src/agent-runner.ts`
+
+**Files:**
+- Modify: `src/agent-runner.ts`
+
+**Step 1: Update `runClaudeSDK()` model selection**
+
+Find (~line 400):
+```typescript
+          model: task.model ?? this.model,
+```
+Change to:
+```typescript
+          model: task.modelOverride ?? task.model ?? this.model,
+```
+
+**Step 2: Update `runClaude()` model selection**
+
+Find (~line 438):
+```typescript
+        "--model", task.model ?? this.model,
+```
+Change to:
+```typescript
+        "--model", task.modelOverride ?? task.model ?? this.model,
+```
+
+**Step 3: Run tsc**
+```bash
+npx tsc --noEmit
+```
+Expected: no errors
+
+**Step 4: Commit**
+```bash
+git add -A && git commit -m "feat(agent-runner): honour task.modelOverride in runClaude and runClaudeSDK"
+```
+
+---
+
+### Wave 3: Scheduler — integrate all three features (depends on Waves 1 + 2)
+
+#### Task 5: Update `src/scheduler.ts`
+
+**Files:**
+- Modify: `src/scheduler.ts`
+
+Apply four sub-changes in sequence. Run `npx tsc --noEmit` after all four before committing.
+
+---
+
+**Sub-change A: Fix prompt accumulation in `executeAndRelease()`**
+
+Find the retry block starting at ~line 544:
+```typescript
+      if (task.status === "failed" && task.retryCount < task.maxRetries) {
+        shouldRetry = true;
+        const prevError = task.error ?? "";
+        task.retryCount++;
+        task.status = "pending";
+        task.completedAt = undefined;
+        // Inject previous error into prompt so the agent can learn from it
+        if (prevError) {
+          const errorContext = prevError.length > 500 ? prevError.slice(0, 500) + "..." : prevError;
+          task.prompt = `${task.prompt}\n\n---\n## Previous Attempt Failed (attempt ${task.retryCount})\nError: ${errorContext}\nFix the error above and try again.`;
+        }
+        task.error = "";
+        // Swap agent on retry for better chance of success
+        const prevAgent = task.agent ?? "claude";
+        task.agent = AgentRunner.pickFallbackAgent(prevAgent);
+        log("info", "task retrying with error context", { taskId: task.id, attempt: task.retryCount, maxRetries: task.maxRetries, agent: prevAgent, fallback: task.agent });
+      }
+```
+
+Replace with:
+```typescript
+      if (task.status === "failed" && task.retryCount < task.maxRetries) {
+        shouldRetry = true;
+        const prevError = task.error ?? "";
+        task.retryCount++;
+        task.status = "pending";
+        task.completedAt = undefined;
+        // Save original prompt on first retry; rebuild from it on subsequent retries
+        if (!task._originalPrompt) {
+          task._originalPrompt = task.prompt;
+        }
+        if (prevError) {
+          const errorContext = prevError.length > 500 ? prevError.slice(0, 500) + "..." : prevError;
+          task.prompt = `${task._originalPrompt}\n\n---\n## Previous Attempt Failed (attempt ${task.retryCount})\nError: ${errorContext}\nFix the error above and try again.`;
+        } else {
+          task.prompt = task._originalPrompt;
+        }
+        // Escalate to opus on second retry (retryCount has already been incremented above)
+        if (task.retryCount >= 2) {
+          task.modelOverride = "claude-opus-4-6";
+        }
+        task.error = "";
+        // Swap agent on retry for better chance of success
+        const prevAgent = task.agent ?? "claude";
+        task.agent = AgentRunner.pickFallbackAgent(prevAgent);
+        log("info", "task retrying with error context", { taskId: task.id, attempt: task.retryCount, maxRetries: task.maxRetries, agent: prevAgent, fallback: task.agent });
+      }
+```
+
+---
+
+**Sub-change B: Fix prompt accumulation in `requeue()`**
+
+Find in `requeue()` (~lines 149–164):
+```typescript
+    // Inject previous error into prompt so agent can learn from it
+    const prevError = task.error ?? "";
+    if (prevError) {
+      const errorContext = prevError.length > 500 ? prevError.slice(0, 500) + "..." : prevError;
+      task.prompt = `${task.prompt}\n\n---\n## Previous Attempt Failed (attempt ${task.retryCount + 1})\nError: ${errorContext}\nFix the error above and try again.`;
+    }
+
+    task.status = "pending";
+    task.error = "";
+    task.retryCount += 1;
+    task.completedAt = undefined;
+```
+
+Replace with:
+```typescript
+    // Save original prompt on first retry; rebuild from it on subsequent retries
+    const prevError = task.error ?? "";
+    if (!task._originalPrompt) {
+      task._originalPrompt = task.prompt;
+    }
+    if (prevError) {
+      const errorContext = prevError.length > 500 ? prevError.slice(0, 500) + "..." : prevError;
+      task.prompt = `${task._originalPrompt}\n\n---\n## Previous Attempt Failed (attempt ${task.retryCount + 1})\nError: ${errorContext}\nFix the error above and try again.`;
+    } else {
+      task.prompt = task._originalPrompt;
+    }
+
+    task.status = "pending";
+    task.error = "";
+    task.retryCount += 1;
+    task.completedAt = undefined;
+    // Escalate to opus on second+ manual retry
+    if (task.retryCount >= 2) {
+      task.modelOverride = "claude-opus-4-6";
+    }
+```
+
+---
+
+**Sub-change C: Update dependency DAG check in `loop()`**
+
+Find the dependency check block (~lines 443–461):
+```typescript
+      if (task.dependsOn) {
+        const dep = this.tasks.get(task.dependsOn) ?? this.store.get(task.dependsOn) ?? undefined;
+        if (dep?.status !== "success") {
+          // If dependency is in a terminal failure state (or missing), fail this task
+          if (!dep || dep.status === "failed" || dep.status === "timeout" || dep.status === "cancelled") {
+            task.status = "failed";
+            task.error = `dependency ${task.dependsOn} is ${dep?.status ?? "missing"}`;
+            task.completedAt = new Date().toISOString();
+            this.store.save(task);
+            this.onEvent?.({ type: "task_final", taskId: task.id, status: task.status });
+            continue;
+          }
+          // Still pending/running — re-queue and wait
+          log("info", "task waiting on dependency", { taskId: task.id, dependsOn: task.dependsOn });
+          this.queue.push(task);
+          await this.waitForDispatch(1_000);
+          continue;
+        }
+      }
+```
+
+Replace with:
+```typescript
+      if (task.dependsOn) {
+        const depIds = Array.isArray(task.dependsOn) ? task.dependsOn : [task.dependsOn];
+        let anyFailed = false;
+        let failedDepId: string | undefined;
+        let failedDepStatus: string | undefined;
+        let allSuccess = true;
+
+        for (const depId of depIds) {
+          const dep = this.tasks.get(depId) ?? this.store.get(depId) ?? undefined;
+          if (!dep || dep.status === "failed" || dep.status === "timeout" || dep.status === "cancelled") {
+            anyFailed = true;
+            failedDepId = depId;
+            failedDepStatus = dep?.status ?? "missing";
+            break;
+          }
+          if (dep.status !== "success") {
+            allSuccess = false;
+          }
+        }
+
+        if (anyFailed) {
+          task.status = "failed";
+          task.error = `dependency ${failedDepId} is ${failedDepStatus}`;
+          task.completedAt = new Date().toISOString();
+          this.store.save(task);
+          this.onEvent?.({ type: "task_final", taskId: task.id, status: task.status });
+          continue;
+        }
+        if (!allSuccess) {
+          log("info", "task waiting on dependency", { taskId: task.id, dependsOn: task.dependsOn });
+          this.queue.push(task);
+          await this.waitForDispatch(1_000);
+          continue;
+        }
+      }
+```
+
+---
+
+**Sub-change D: Staged rebase after merge + update `submit()` opts type**
+
+Find in `executeAndRelease()` the merge result line (~line 514):
+```typescript
+      const mergeResult = await this.pool.release(workerName, shouldMerge, task.id);
+
+      if (shouldMerge && !mergeResult.merged) {
+```
+
+After `pool.release(...)`, insert the rebase block:
+```typescript
+      const mergeResult = await this.pool.release(workerName, shouldMerge, task.id);
+
+      // After a successful merge, rebase other active workers onto new main (best-effort)
+      if (shouldMerge && mergeResult.merged) {
+        for (const otherWorker of this.pool.getActiveWorkers(workerName)) {
+          this.pool.rebaseOnMain(otherWorker).catch((err: unknown) => {
+            log("warn", "staged rebase failed (best-effort)", { worker: otherWorker, error: String(err) });
+          });
+        }
+      }
+
+      if (shouldMerge && !mergeResult.merged) {
+```
+
+Also update the `submit()` method signature to accept `dependsOn?: string | string[]`:
+
+Find (~line 72):
+```typescript
+  submit(prompt: string, opts?: { id?: string; timeout?: number; maxBudget?: number; priority?: import("./types.js").TaskPriority; dependsOn?: string; webhookUrl?: string; tags?: string[]; agent?: string; allowLongPrompt?: boolean }): Task {
+```
+
+Change `dependsOn?: string` to `dependsOn?: string | string[]`.
+
+---
+
+**Step 5: Run tsc**
+```bash
+npx tsc --noEmit
+```
+Expected: no errors. Fix any type errors before proceeding.
+
+**Step 6: Run existing tests to verify nothing broke**
+```bash
+node --import tsx --test src/__tests__/scheduler.test.ts
+```
+Expected: all existing tests pass (some may fail due to missing `getActiveWorkers`/`rebaseOnMain` in the mock — see Task 6 fix below, but do not commit tests yet)
+
+**Step 7: Commit**
+```bash
+git add -A && git commit -m "feat(scheduler): fix prompt accumulation, model escalation, array dependsOn, staged rebase"
+```
+
+---
+
+### Wave 4: Tests (parallel — different test files)
+
+#### Task 6: Tests for WorktreePool new methods
+
+**Files:**
+- Modify: `src/__tests__/worktree-pool.test.ts`
+
+Append two new `describe` blocks at the end of the file (after the existing "WorktreePool stats" block):
+
+```typescript
+// ---------------------------------------------------------------------------
+// getActiveWorkers
+// ---------------------------------------------------------------------------
+
+describe("WorktreePool.getActiveWorkers", () => {
+  it("returns empty array when no workers are busy", async () => {
+    const { repoPath, cleanup } = await makeTempRepo();
+    try {
+      const pool = new WorktreePool(repoPath, 2);
+      await pool.init();
+
+      assert.deepStrictEqual(pool.getActiveWorkers(), [], "no workers should be active initially");
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("returns all busy worker names", async () => {
+    const { repoPath, cleanup } = await makeTempRepo();
+    try {
+      const pool = new WorktreePool(repoPath, 3);
+      await pool.init();
+
+      const w1 = await pool.acquire();
+      const w2 = await pool.acquire();
+      assert.ok(w1 !== null && w2 !== null);
+
+      const active = pool.getActiveWorkers();
+      assert.strictEqual(active.length, 2, "should report 2 active workers");
+      assert.ok(active.includes(w1.name), "should include first acquired worker");
+      assert.ok(active.includes(w2.name), "should include second acquired worker");
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("excludes the named worker from results", async () => {
+    const { repoPath, cleanup } = await makeTempRepo();
+    try {
+      const pool = new WorktreePool(repoPath, 3);
+      await pool.init();
+
+      const w1 = await pool.acquire();
+      const w2 = await pool.acquire();
+      assert.ok(w1 !== null && w2 !== null);
+
+      const active = pool.getActiveWorkers(w1.name);
+      assert.strictEqual(active.length, 1, "should return 1 after excluding one");
+      assert.strictEqual(active[0], w2.name, "remaining entry should be the non-excluded worker");
+    } finally {
+      cleanup();
+    }
+  });
+});
+
+// ---------------------------------------------------------------------------
+// rebaseOnMain
+// ---------------------------------------------------------------------------
+
+describe("WorktreePool.rebaseOnMain", () => {
+  it("returns false for unknown worker name", async () => {
+    const { repoPath, cleanup } = await makeTempRepo();
+    try {
+      const pool = new WorktreePool(repoPath, 1);
+      await pool.init();
+
+      const result = await pool.rebaseOnMain("nonexistent");
+      assert.strictEqual(result, false, "unknown worker should return false");
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("returns true when branch is already up to date with main", async () => {
+    const { repoPath, cleanup } = await makeTempRepo();
+    try {
+      const pool = new WorktreePool(repoPath, 1);
+      await pool.init();
+
+      // Worker was just reset to current main tip — nothing to rebase
+      const worker = await pool.acquire();
+      assert.ok(worker !== null);
+
+      const result = await pool.rebaseOnMain(worker.name);
+      assert.strictEqual(result, true, "up-to-date branch should rebase successfully");
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("returns true after rebasing worker branch onto new main commits", async () => {
+    const { repoPath, cleanup } = await makeTempRepo();
+    try {
+      const pool = new WorktreePool(repoPath, 2);
+      await pool.init();
+
+      // Acquire worker-0 and add a commit on its branch (non-conflicting file)
+      const w0 = await pool.acquire();
+      assert.ok(w0 !== null);
+      fs.writeFileSync(path.join(w0.path, "worker-file.txt"), "worker work\n");
+      const git0 = (...args: string[]) => execFileAsync("git", args, { cwd: w0.path });
+      await git0("add", "worker-file.txt");
+      await git0("commit", "-m", "worker commit");
+
+      // Simulate a new commit landing on main via worker-1
+      const w1 = await pool.acquire();
+      assert.ok(w1 !== null);
+      fs.writeFileSync(path.join(w1.path, "main-new.txt"), "new on main\n");
+      const git1 = (...args: string[]) => execFileAsync("git", args, { cwd: w1.path });
+      await git1("add", "main-new.txt");
+      await git1("commit", "-m", "new main commit");
+      const { stdout: newSha } = await git1("rev-parse", "HEAD");
+      // Update main ref to simulate a squash merge landing
+      await execFileAsync("git", ["update-ref", "refs/heads/main", newSha.trim()], { cwd: repoPath });
+
+      // Rebase w0 onto new main
+      const result = await pool.rebaseOnMain(w0.name);
+      assert.strictEqual(result, true, "rebase onto non-conflicting main should succeed");
+    } finally {
+      cleanup();
+    }
+  });
+});
+```
+
+**Step 1: Append the two describe blocks**
+
+**Step 2: Run the test file**
+```bash
+node --import tsx --test src/__tests__/worktree-pool.test.ts
+```
+Expected: all tests pass including new ones
+
+**Step 3: Commit**
+```bash
+git add -A && git commit -m "test(worktree-pool): getActiveWorkers and rebaseOnMain coverage"
+```
+
+---
+
+#### Task 7: Tests for Scheduler new behaviour
+
+**Files:**
+- Modify: `src/__tests__/scheduler.test.ts`
+
+**Step 1: Update `makePool()` mock at the top of the file**
+
+The existing `makePool()` returns an object without `getActiveWorkers` or `rebaseOnMain`. The scheduler now calls both. Find `makePool()` and add the two stubs:
+
+```typescript
+function makePool(): WorktreePool {
+  return {
+    available: 2,
+    busy: 0,
+    acquire: async () => ({ name: "w0", path: "/tmp/w0", branch: "worker/w0", busy: true }),
+    release: async () => ({ merged: true }),
+    init: async () => {},
+    getStatus: () => [],
+    getActiveWorkers: (_exclude?: string) => [],
+    rebaseOnMain: async (_name: string) => true,
+  } as unknown as WorktreePool;
+}
+```
+
+**Step 2: Append new describe blocks at the end of the file**
+
+```typescript
+// ---------------------------------------------------------------------------
+// Prompt accumulation fix
+// ---------------------------------------------------------------------------
+
+describe("Scheduler retry — prompt accumulation fix", () => {
+  it("second retry rebuilds prompt from _originalPrompt, not accumulated prompt", async () => {
+    let callCount = 0;
+    const capturedPrompts: string[] = [];
+
+    const runner = {
+      run: async (task: Task) => {
+        callCount++;
+        capturedPrompts.push(task.prompt);
+        if (callCount <= 2) {
+          task.status = "failed";
+          task.error = `error on attempt ${callCount}`;
+          task.durationMs = 10;
+        } else {
+          task.status = "success";
+          task.durationMs = 10;
+        }
+        return task;
+      },
+      getRunningTasks: () => [],
+      reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+    } as unknown as import("../agent-runner.js").AgentRunner;
+
+    const store = makeStore();
+    const s = new Scheduler(makePool(), runner, store);
+    s.start();
+
+    s.submit("original prompt text", { maxRetries: 3 });
+    // Allow enough time for 3 attempts
+    await new Promise((r) => setTimeout(r, 600));
+    await s.stop();
+
+    // Every attempt after the first should see exactly one "## Previous Attempt Failed" section
+    for (let i = 1; i < capturedPrompts.length; i++) {
+      const sections = (capturedPrompts[i].match(/## Previous Attempt Failed/g) ?? []).length;
+      assert.strictEqual(sections, 1,
+        `Attempt ${i + 1} prompt should have exactly 1 error section, got ${sections}.\nPrompt: ${capturedPrompts[i].slice(0, 300)}`);
+    }
+  });
+
+  it("stores _originalPrompt on first retry", async () => {
+    let callCount = 0;
+
+    const runner = {
+      run: async (task: Task) => {
+        callCount++;
+        if (callCount === 1) {
+          task.status = "failed";
+          task.error = "first failure";
+          task.durationMs = 10;
+        } else {
+          task.status = "success";
+          task.durationMs = 10;
+        }
+        return task;
+      },
+      getRunningTasks: () => [],
+      reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+    } as unknown as import("../agent-runner.js").AgentRunner;
+
+    const store = makeStore();
+    const s = new Scheduler(makePool(), runner, store);
+    s.start();
+
+    const task = s.submit("the real original prompt", { maxRetries: 1 });
+    await new Promise((r) => setTimeout(r, 400));
+    await s.stop();
+
+    assert.strictEqual(task._originalPrompt, "the real original prompt",
+      "_originalPrompt should be saved after first retry");
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Model escalation
+// ---------------------------------------------------------------------------
+
+describe("Scheduler retry — model escalation", () => {
+  it("sets modelOverride to claude-opus-4-6 on retryCount >= 2", async () => {
+    const modelOverrides: Array<string | undefined> = [];
+    let callCount = 0;
+
+    const runner = {
+      run: async (task: Task) => {
+        callCount++;
+        modelOverrides.push(task.modelOverride);
+        task.status = "failed";
+        task.error = "always fails";
+        task.durationMs = 10;
+        return task;
+      },
+      getRunningTasks: () => [],
+      reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+    } as unknown as import("../agent-runner.js").AgentRunner;
+
+    const s = new Scheduler(makePool(), runner, makeStore());
+    s.start();
+    s.submit("test model escalation", { maxRetries: 2 });
+    await new Promise((r) => setTimeout(r, 600));
+    await s.stop();
+
+    // 3 total attempts: attempt 0, 1, 2
+    // On attempt at retryCount=2 (third call), modelOverride should be "claude-opus-4-6"
+    assert.ok(callCount >= 3, `expected at least 3 attempts, got ${callCount}`);
+    assert.strictEqual(modelOverrides[2], "claude-opus-4-6",
+      `third attempt (retryCount=2) should use claude-opus-4-6, got: ${modelOverrides[2]}`);
+    // First two attempts should not have modelOverride set
+    assert.strictEqual(modelOverrides[0], undefined, "first attempt should not have modelOverride");
+    assert.strictEqual(modelOverrides[1], undefined, "second attempt (retryCount=1) should not have modelOverride");
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Array dependsOn (DAG)
+// ---------------------------------------------------------------------------
+
+describe("Scheduler dependency DAG — array dependsOn", () => {
+  it("task with string[] dependsOn waits for all deps before running", async () => {
+    const store = makeStore();
+    const completionOrder: string[] = [];
+
+    const runner = {
+      run: async (task: Task) => {
+        await new Promise((r) => setTimeout(r, 30));
+        task.status = "success";
+        task.durationMs = 30;
+        completionOrder.push(task.id);
+        return task;
+      },
+      getRunningTasks: () => [],
+      reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+    } as unknown as import("../agent-runner.js").AgentRunner;
+
+    // Pool with 3 workers so deps can run in parallel
+    const pool = {
+      available: 3,
+      busy: 0,
+      acquire: (() => {
+        let n = 0;
+        return async () => ({ name: `w${n++}`, path: `/tmp/w${n}`, branch: `worker/w${n}`, busy: true });
+      })(),
+      release: async () => ({ merged: true }),
+      init: async () => {},
+      getStatus: () => [],
+      getActiveWorkers: () => [],
+      rebaseOnMain: async () => true,
+    } as unknown as import("../worktree-pool.js").WorktreePool;
+
+    const s = new Scheduler(pool, runner, store);
+    s.start();
+
+    const dep1 = s.submit("dep task 1");
+    const dep2 = s.submit("dep task 2");
+    const dependent = s.submit("dependent task", { dependsOn: [dep1.id, dep2.id] });
+
+    await new Promise((r) => setTimeout(r, 600));
+    await s.stop();
+
+    const savedDependent = store.get(dependent.id);
+    assert.strictEqual(savedDependent?.status, "success",
+      `dependent task should succeed, got: ${savedDependent?.status}`);
+
+    const dep1Idx = completionOrder.indexOf(dep1.id);
+    const dep2Idx = completionOrder.indexOf(dep2.id);
+    const depIdx = completionOrder.indexOf(dependent.id);
+    assert.ok(dep1Idx !== -1, "dep1 should have completed");
+    assert.ok(dep2Idx !== -1, "dep2 should have completed");
+    assert.ok(depIdx !== -1, "dependent should have completed");
+    assert.ok(dep1Idx < depIdx, "dep1 must complete before dependent");
+    assert.ok(dep2Idx < depIdx, "dep2 must complete before dependent");
+  });
+
+  it("dependent task fails immediately when any dep in array fails", async () => {
+    const store = makeStore();
+
+    const runner = {
+      run: async (task: Task) => {
+        if (task.prompt === "will fail") {
+          task.status = "failed";
+          task.error = "intentional failure";
+        } else {
+          task.status = "success";
+        }
+        task.durationMs = 10;
+        return task;
+      },
+      getRunningTasks: () => [],
+      reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+    } as unknown as import("../agent-runner.js").AgentRunner;
+
+    const pool = {
+      available: 2,
+      busy: 0,
+      acquire: (() => {
+        let n = 0;
+        return async () => ({ name: `w${n++}`, path: `/tmp/w${n}`, branch: `worker/w${n}`, busy: true });
+      })(),
+      release: async () => ({ merged: true }),
+      init: async () => {},
+      getStatus: () => [],
+      getActiveWorkers: () => [],
+      rebaseOnMain: async () => true,
+    } as unknown as import("../worktree-pool.js").WorktreePool;
+
+    const s = new Scheduler(pool, runner, store);
+    s.start();
+
+    const depFailing = s.submit("will fail", { maxRetries: 0 });
+    const depOk = s.submit("will succeed");
+    const dependent = s.submit("dep on both", { dependsOn: [depFailing.id, depOk.id] });
+
+    await new Promise((r) => setTimeout(r, 500));
+    await s.stop();
+
+    const savedDependent = store.get(dependent.id);
+    assert.strictEqual(savedDependent?.status, "failed",
+      `dependent should be failed when a dep fails, got: ${savedDependent?.status}`);
+    assert.ok(savedDependent?.error.includes(depFailing.id),
+      `error message should reference the failed dep ID. Got: ${savedDependent?.error}`);
+  });
+
+  it("string dependsOn (single ID, backward-compat) still works", () => {
+    const store = makeStore();
+    const s = new Scheduler(makePool(), makeRunner(), store);
+
+    const dep = s.submit("parent task");
+    dep.status = "success";
+    store.save(dep);
+
+    // String (not array) — must not break
+    const child = s.submit("child task", { dependsOn: dep.id });
+    assert.strictEqual(child.status, "pending",
+      "child with string dependsOn should be pending (not immediately failed)");
+  });
+});
+```
+
+**Step 3: Run the full scheduler test file**
+```bash
+node --import tsx --test src/__tests__/scheduler.test.ts
+```
+Expected: all tests pass
+
+**Step 4: Run the entire test suite**
+```bash
+node --import tsx --test src/__tests__/*.test.ts
+```
+Expected: all tests pass
+
+**Step 5: Commit**
+```bash
+git add -A && git commit -m "test(scheduler): prompt accumulation fix, model escalation, array dependsOn coverage"
+```
+
+---
+
+## Risks
+
+| Risk | Mitigation |
+|------|-----------|
+| **SQL param count mismatch** — `taskToParams` now returns 26 params but SQL might still expect 25 | Count `?` placeholders in every INSERT/UPDATE statement after editing. 26 columns in INSERT, 25 SET clauses + 1 WHERE in UPDATE (26 total params, same array) |
+| **`retryCount` increment order** — in `executeAndRelease`, `retryCount++` happens BEFORE the `>= 2` check. In `requeue()`, `retryCount += 1` happens AFTER. Be careful: escalation fires at retryCount=2 in both places | Double-check: after `task.retryCount++` the value is 2 on the third attempt. In requeue, `retryCount += 1` then `if (task.retryCount >= 2)` — same logic |
+| **Rebase locking** — `rebaseOnMain` calls `gitIn` which runs in a worktree. If the worktree is actively running an agent that is also calling git, rebase could conflict | Rebase is best-effort, fires after the current worker's merge completes (that worker is already released). Other active workers are using different worktree paths |
+| **Test timing flakiness** — async scheduler tests use `setTimeout` delays. Slow CI might fail | If tests flake, increase delays. 600ms allows 3 × 10ms-duration runs with plenty of scheduling overhead |
+| **`dependsOn` JSON round-trip** — reading old DB rows where `depends_on` is a plain string like `"abc123"` must not be accidentally JSON-parsed | The `startsWith('[')` guard handles this — only arrays are parsed as JSON |
diff --git a/docs/plans/2026-03-05-v0.1.7-plan.md b/docs/plans/2026-03-05-v0.1.7-plan.md
new file mode 100644
index 0000000..a0d9444
--- /dev/null
+++ b/docs/plans/2026-03-05-v0.1.7-plan.md
@@ -0,0 +1,235 @@
+# v0.1.7 Plan — Post-mortem + Research-Driven
+
+## v0.1.6 Post-mortem
+
+### Pipeline Run #2 Facts
+- 5 waves, 7 tasks, 7/7 "success", verify passed, $5.65
+- Only **3 of 7 tasks** produced commits that merged (43%)
+- 4 tasks ran, agent exited 0, but **no code committed**
+- Manual fix: multi-dep check, scheduler integration, modelOverride, rebase wiring
+
+### Root Causes (B1-B5)
+
+| # | Bug | Root Cause | Fix |
+|---|-----|-----------|-----|
+| B1 | Empty commit = silent success | `worktree-pool.ts:189` returns `{merged:true}` when no new commits | F1: detect + fail |
+| B2 | No commit detection | `agent-runner.ts:331` silently ignores empty diff | F1: detect + fail |
+| B3 | Scheduler integration always fails (0/2) | 618 LOC file, agent can't complete multi-point integration in $5/5min | F7: use Codex GPT-5.4 1M for complex files |
+| B4 | System prompt too weak on commit | "git add && git commit" is suggestion not enforcement | F2: CRITICAL warning |
+| B5 | Working directory desync after merge | main worktree doesn't reflect merges from worker branches | F3: post-merge sync |
+
+### Pattern Across Both Cycles
+
+| Cycle | Tasks | Committed | Commit Rate | Manual Fix |
+|-------|-------|-----------|-------------|------------|
+| v0.1.5 | 6 | 3 | 50% | Classifier regex, scheduler integration |
+| v0.1.6 | 7 | 3 | 43% | Multi-dep, rebase wiring, modelOverride |
+
+**B3 is the hardest**: Scheduler.ts is the integration hub. Every feature touches it. Both v0.1.5 and v0.1.6 pipeline runs specifically failed on "modify scheduler.ts" tasks — 0% success.
+
+**Research insight** (NeurIPS 2025): "79% of multi-agent failures are specification/coordination issues, not technical." — Our problem is exactly this: the agent knows what to do but can't coordinate the change across multiple insertion points in a large file.
+
+---
+
+## Research Inputs (from docs/)
+
+### From 3-agents-reference.md — Agent Gaps
+
+| Gap | Agent | Priority | v0.1.7? |
+|-----|-------|----------|---------|
+| Codex hardcoded o4-mini | Codex | P0 | **F7** — route deep tasks to GPT-5.4 |
+| Pricing table incomplete | All | P0 | **F4** |
+| No `--resume` on retry | Claude CLI | P0 | **F5** |
+| No `--json-schema` for review | Claude CLI | P1 | **F6** |
+| No `--fallback-model` | Claude CLI | P1 | F8 (stretch) |
+| No `--max-turns` | Claude CLI | P2 | defer |
+| SDK still V1 `query()` | Claude SDK | P0 | defer (breaking, needs dedicated sprint) |
+| No config.toml profiles | Codex | P0 | **F9** — generate default + wide profiles |
+| No `model_reasoning_effort` | Codex | P1 | defer |
+| 1M context routing | Codex | P1 | **F7** — deep + multi-file → wide profile |
+
+### From agent-landscape.md — Model Pricing
+
+| Model | $/M In | $/M Out | SWE-bench | Context |
+|-------|--------|---------|-----------|---------|
+| claude-haiku-4-5 | 0.80 | 4.00 | ~40% | 200K |
+| claude-sonnet-4-6 | 3.00 | 15.00 | ~65% | 200K |
+| claude-opus-4-6 | 15.00 | 75.00 | 80.9% | 200K |
+| gpt-5.4 (272K) | 2.50 | 15.00 | 77.2% | 272K |
+| gpt-5.4 (1M wide) | 5.00 | 22.50 | 77.2% | 1.05M |
+| o4-mini | 1.10 | 4.40 | ~55% | 200K |
+
+**Key insight**: GPT-5.4 at $2.50/$15 achieves 77.2% SWE-bench — nearly Opus level (80.9%) at **6x cheaper input, 5x cheaper output**. For scheduler.ts integration tasks (B3), using GPT-5.4 with 1M context could solve the problem: agent can hold entire codebase in context.
+
+### From STRATEGY.md — Four Pillars Status
+
+| Pillar | Status |
+|--------|--------|
+| 1. Dependency-aware dispatch | **DONE** (DAG in v0.1.6) |
+| 2. Staged merging | **DONE** (rebase in v0.1.6) |
+| 3. Failure diagnosis | PARTIAL (error injection done, structured diagnosis not done) |
+| 4. Agent self-evolution | NOT STARTED |
+
+### From GAP-ANALYSIS.md — Dead Code
+
+All dead code files (state-machine, router, memory, workpad, orchestrator) already removed. The gap analysis is partially stale — update needed.
+
+### From ROADMAP.md — Phase 1 Status
+
+| Roadmap Feature | Status |
+|----------------|--------|
+| Wave planner | **DONE** (pipeline decompose stage) |
+| Staged merger | **DONE** (rebaseOnMain in v0.1.6) |
+| Failure diagnoser | NOT DONE (only basic error injection) |
+| Pipeline | **DONE** (5-stage state machine since v0.1.3) |
+| CI feedback | **DONE** (error context retry since v0.1.4) |
+
+Phase 1 is ~80% complete. Remaining: structured failure diagnosis.
+
+---
+
+## v0.1.7 Features
+
+### Tier 1: Fix Self-Hosting Loop (P0)
+
+**F1: Empty commit detection** — `agent-runner.ts`
+- After agent exits, check `git log main..HEAD --oneline`
+- If empty + status="success" → set status="failed", error="no commits produced"
+- This triggers retry, giving agent a second chance with error context
+- LOC: ~15
+
+**F2: Enforce commit in system prompt** — `agent-runner.ts`
+- Append to every task prompt:
+  `CRITICAL: You MUST run 'git add -A && git commit -m "..."' before exiting. If you do not commit, your work will be LOST and the task will be marked FAILED.`
+- LOC: ~5
+
+**F7: Codex GPT-5.4 routing for complex files** — `agent-runner.ts` + `task-classifier.ts`
+- When task targets files >400 LOC (like scheduler.ts), route to Codex + GPT-5.4
+- `task-classifier.ts` outputs `{ category, model, agent, contextProfile }` (not just model)
+- `agent` field: "claude" for most, "codex" for deep + large-file tasks
+- `contextProfile`: "default" or "wide" — Codex uses wide (1M) for deep tasks
+- `runCodex()` uses GPT-5.4 instead of hardcoded o4-mini when `task.model` specified
+- LOC: ~30
+
+**F9: Codex config.toml profile management** — `agent-runner.ts`
+- On startup, check `~/.codex/config.toml` exists
+- If missing or outdated, generate with default + wide profiles:
+  ```toml
+  [profiles.default]
+  model = "gpt-5.4"
+  model_reasoning_effort = "medium"
+
+  [profiles.wide]
+  model = "gpt-5.4"
+  model_reasoning_effort = "medium"
+  model_context_window = 1050000
+  model_auto_compact_token_limit = 900000
+  ```
+- LOC: ~25
+
+### Tier 2: Agent Modernization (P1)
+
+**F4: Complete pricing table** — `agent-runner.ts`
+- Add all 6 models to `estimateCost()` rates table
+- LOC: ~10
+
+**F5: `--resume` on retry** — `agent-runner.ts`
+- Parse session ID from Claude CLI stream-json output
+- Store as `task.sessionId` in types.ts
+- On retry, add `--resume <sessionId>` to CLI args
+- LOC: ~20
+
+**F6: `--json-schema` for review** — `agent-runner.ts`
+- Add `--json-schema` flag to review agent invocation
+- Schema: `{"type":"object","properties":{"approve":{"type":"boolean"},"score":{"type":"number"},...}}`
+- Eliminate regex fallback parsing
+- LOC: ~15
+
+### Tier 3: Housekeeping (P1)
+
+**F3: Post-merge working directory sync** — `worktree-pool.ts`
+- After mergeToMain succeeds, run `git checkout HEAD -- .` in repo root
+- Ensures main worktree files match HEAD
+- LOC: ~5
+
+---
+
+## Consolidated Roadmap View
+
+### Done (v0.1.3-v0.1.6)
+
+| Feature | Version | Source |
+|---------|---------|--------|
+| 5-stage pipeline | v0.1.3 | Roadmap Phase 1 |
+| Cross-agent review | v0.1.3 | Roadmap Phase 1 |
+| Error context retry | v0.1.4 | v0.2 plan 1.1 |
+| Wave conflict validation | v0.1.4 | v0.2 plan 2.2 (basic) |
+| Budget-based retry loop | v0.1.4 | v0.2 plan 3.3 (basic) |
+| Dead-loop detection | v0.1.4 | v0.2 plan 3.2 (basic) |
+| Task classifier | v0.1.5 | v0.2 plan 2.1 |
+| Model fallback on retry | v0.1.5 | v0.2 plan 1.1 |
+| Prompt accumulation fix | v0.1.6 | v0.2 plan 1.1 |
+| Model escalation on retry | v0.1.6 | v0.2 plan 1.1 |
+| Staged merge + rebase | v0.1.6 | v0.2 plan 1.2 |
+| Dependency DAG | v0.1.6 | v0.2 plan 1.3 |
+
+### v0.1.7 (This Release)
+
+| Feature | Source | LOC |
+|---------|--------|-----|
+| F1: Empty commit detection | **Post-mortem B1+B2** | 15 |
+| F2: Enforce commit prompt | **Post-mortem B4** | 5 |
+| F7: Codex GPT-5.4 routing | **3-agents-reference + Post-mortem B3** | 30 |
+| F9: Codex config.toml | **3-agents-reference** | 25 |
+| F4: Pricing table | **3-agents-reference + agent-landscape** | 10 |
+| F5: --resume on retry | **3-agents-reference** | 20 |
+| F6: --json-schema review | **3-agents-reference** | 15 |
+| F3: Working dir sync | **Post-mortem B5** | 5 |
+| **Total** | | **~125** |
+
+### v0.1.8+ (Backlog, from v0.2 plan + roadmap)
+
+| Feature | Source | Priority |
+|---------|--------|----------|
+| Import graph wave validation | v0.2 plan 2.2 | P1 |
+| Failure pattern injection | v0.2 plan 2.3 | P1 |
+| Enhanced verification gate | v0.2 plan 3.1 | P1 |
+| Smart dead-loop (oscillation) | v0.2 plan 3.2 | P2 |
+| Budget-aware model downgrade | v0.2 plan 3.3 | P2 |
+| SDK V2 upgrade | 3-agents-reference | P1 |
+| Lifecycle hooks | 3-agents-reference | P2 |
+| Agent version monitor | STRATEGY.md Pillar 4 | P2 |
+| Stall detection | Roadmap Phase 2 | P1 |
+| JSONL session monitor | Roadmap Phase 2 | P1 |
+| Failure diagnoser (structured) | Roadmap Phase 1 | P1 |
+
+---
+
+## Implementation Order
+
+1. F1 + F2: Empty commit detection + enforce prompt (agent-runner.ts) — **blocks everything**
+2. F4: Pricing table (agent-runner.ts) — quick win, same file
+3. F7 + F9: Codex GPT-5.4 routing + config.toml (task-classifier.ts, agent-runner.ts) — **fixes B3**
+4. F3: Working dir sync (worktree-pool.ts)
+5. F5: --resume (agent-runner.ts)
+6. F6: --json-schema (agent-runner.ts)
+
+## Test Plan
+
+- F1: Mock agent with 0 commits → task.status === "failed", error contains "no commits"
+- F2: buildTaskPrompt output contains "MUST run git add"
+- F4: estimateCost correct for all 6 models
+- F7: classifyTask returns agent="codex" for deep + large-file tasks
+- F9: generateCodexConfig creates valid TOML with default + wide profiles
+- F3: After mergeToMain, working tree matches HEAD
+- F5: sessionId captured from stream-json, --resume flag in retry args
+- F6: Review invocation includes --json-schema
+
+## Success Metrics
+
+| Metric | v0.1.6 | Target v0.1.7 |
+|--------|--------|---------------|
+| Task commit rate | 43% | >75% |
+| Manual fix needed | ~60% | <25% |
+| Scheduler integration success | 0/2 | 1/1+ |
+| Cost per pipeline run | $5.65 | <$8 (GPT-5.4 cheaper) |
diff --git a/docs/plans/2026-03-05-v0.2-implementation-plan.md b/docs/plans/2026-03-05-v0.2-implementation-plan.md
new file mode 100644
index 0000000..a7a941f
--- /dev/null
+++ b/docs/plans/2026-03-05-v0.2-implementation-plan.md
@@ -0,0 +1,867 @@
+# cc-manager v0.2 Implementation Plan
+
+> Target: 0% → 90%+ auto-merge success rate, 50% cost reduction
+> Total: 7 features, ~500 LOC, 3 phases
+
+---
+
+## Phase 1: Critical Path (Day 1-2)
+
+Goal: Fix the two root causes of 0% auto-merge.
+
+### 1.1 Fix Error Context Bug + Model Escalation
+
+**Problem:** `scheduler.ts:549` clears `task.error = ""` before retry. The error injection
+at line 545-547 reads `prevError` from `task.error`, but the clear at 549 wipes it for
+future retries. Also: retry always uses the same model — no escalation.
+
+**Files to modify:**
+- `src/scheduler.ts` (lines 537-551)
+- `src/agent-runner.ts` (lines 55-62)
+- `src/types.ts` (add `modelOverride` field)
+
+**Changes:**
+
+#### 1.1.1 scheduler.ts — Preserve error, don't accumulate prompts
+
+```typescript
+// CURRENT (line 537-551):
+if (task.status === "failed" && task.retryCount < task.maxRetries) {
+  shouldRetry = true;
+  const prevError = task.error ?? "";
+  task.retryCount++;
+  task.status = "pending";
+  task.completedAt = undefined;
+  if (prevError) {
+    const errorContext = prevError.length > 500 ? prevError.slice(0, 500) + "..." : prevError;
+    task.prompt = `${task.prompt}\n\n---\n## Previous Attempt Failed (attempt ${task.retryCount})\nError: ${errorContext}\nFix the error above and try again.`;
+  }
+  task.error = "";  // BUG: clears error context
+  ...
+}
+
+// NEW:
+if (task.status === "failed" && task.retryCount < task.maxRetries) {
+  shouldRetry = true;
+  const prevError = task.error ?? "";
+  task.retryCount++;
+  task.status = "pending";
+  task.completedAt = undefined;
+
+  // Store original prompt on first retry to avoid prompt accumulation
+  if (!task._originalPrompt) task._originalPrompt = task.prompt;
+
+  if (prevError) {
+    const errorContext = prevError.length > 500 ? prevError.slice(0, 500) + "..." : prevError;
+    task.prompt = `${task._originalPrompt}\n\n---\n## Previous Attempt Failed (attempt ${task.retryCount}/${task.maxRetries})\nError: ${errorContext}\nFix the error above and try again.`;
+  }
+
+  // Model escalation: retry 2+ uses Opus
+  if (task.retryCount >= 2) {
+    task.modelOverride = "claude-opus-4-6";
+    log("info", "escalating model for retry", { taskId: task.id, model: "claude-opus-4-6" });
+  }
+
+  // DO NOT clear task.error — keep it for diagnostics
+  // task.error = "";  // REMOVED
+  ...
+}
+```
+
+#### 1.1.2 types.ts — Add fields
+
+```typescript
+// Add to Task interface:
+export interface Task {
+  // ... existing fields ...
+  modelOverride?: string;   // Set by retry logic to escalate model
+  _originalPrompt?: string; // Preserved original prompt before error injection
+}
+```
+
+#### 1.1.3 agent-runner.ts — Respect modelOverride
+
+```typescript
+// CURRENT (line 58-62):
+constructor(
+  private model: string = "claude-sonnet-4-6",
+  ...
+)
+
+// In run() method, before spawning agent:
+const model = task.modelOverride ?? this.model;
+// Use `model` instead of `this.model` when spawning Claude CLI/SDK
+```
+
+**Tests to add:**
+- Retry preserves error context (error field not empty after re-queue)
+- Prompt accumulation prevented (_originalPrompt preserved)
+- Model escalation triggers on retryCount >= 2
+- Cost estimation uses correct model rates for escalated tasks
+
+**LOC: ~25**
+
+---
+
+### 1.2 Staged Merge + Rebase
+
+**Problem:** Parallel worktrees all branch from the same `main`. Task A creates `types.ts`,
+Task B imports from `types.ts` — but B can't see A's changes until both merge. This is the
+root cause of TSC failures in parallel execution.
+
+**Files to modify:**
+- `src/worktree-pool.ts` (add `rebaseOnMain()`, modify `release()`)
+- `src/scheduler.ts` (rebase active workers after merge in `executeAndRelease()`)
+
+**Changes:**
+
+#### 1.2.1 worktree-pool.ts — Add rebaseOnMain()
+
+```typescript
+/**
+ * Rebases a worker's branch onto the latest main.
+ * Returns true if rebase succeeded, false if conflicts (aborts rebase).
+ */
+async rebaseOnMain(workerName: string): Promise<boolean> {
+  const w = this.workers.find(w => w.name === workerName);
+  if (!w || !w.busy) return false;
+
+  try {
+    // Fetch latest main ref
+    await this.gitIn(w.path, "fetch", ".", "main");
+    // Attempt rebase onto main
+    await this.gitIn(w.path, "rebase", "main");
+    log("info", "[pool] rebased worker onto main", { worker: workerName });
+    return true;
+  } catch {
+    // Conflict — abort rebase, worker continues with stale base
+    try {
+      await this.gitIn(w.path, "rebase", "--abort");
+    } catch { /* already clean */ }
+    log("warn", "[pool] rebase conflict, worker continues on stale base", { worker: workerName });
+    return false;
+  }
+}
+
+/**
+ * Returns list of currently busy worker names (excluding the given one).
+ */
+getActiveWorkers(exclude?: string): string[] {
+  return this.workers
+    .filter(w => w.busy && w.name !== exclude)
+    .map(w => w.name);
+}
+```
+
+#### 1.2.2 scheduler.ts — Rebase active workers after successful merge
+
+```typescript
+// In executeAndRelease(), after the merge succeeds (line 508):
+const mergeResult = await this.pool.release(workerName, shouldMerge, task.id);
+
+// NEW: After successful merge, rebase all other active workers onto new main
+if (shouldMerge && mergeResult.merged) {
+  const activeWorkers = this.pool.getActiveWorkers(workerName);
+  for (const otherWorker of activeWorkers) {
+    // Best effort — don't fail the current task if rebase fails
+    await this.pool.rebaseOnMain(otherWorker).catch((err) => {
+      log("warn", "rebase failed for active worker", { worker: otherWorker, err: String(err) });
+    });
+  }
+}
+```
+
+**Key design decisions:**
+- Rebase is **best-effort**: if it conflicts, the worker continues on stale base
+  (the task may fail at TSC check, which is already handled by retry)
+- Rebase happens after EVERY successful merge, not just between waves
+- This means even within a single wave, tasks that finish early update main for
+  still-running tasks
+
+**Tests to add:**
+- rebaseOnMain() succeeds when no conflicts
+- rebaseOnMain() aborts cleanly on conflict
+- getActiveWorkers() excludes specified worker
+- After merge, other active workers get rebased (integration test)
+- Rebase failure doesn't crash the merge flow
+
+**LOC: ~50**
+
+---
+
+### 1.3 Dependency DAG (string → string[])
+
+**Problem:** `types.ts:34` has `dependsOn?: string` — only one parent dependency.
+Cannot express "Task C depends on both Task A and Task B".
+
+**Files to modify:**
+- `src/types.ts` (line 34)
+- `src/scheduler.ts` (lines 437-454)
+- `src/store.ts` (serialization)
+
+**Changes:**
+
+#### 1.3.1 types.ts
+
+```typescript
+// CURRENT:
+dependsOn?: string;
+
+// NEW:
+dependsOn?: string | string[];  // Backward compatible
+```
+
+#### 1.3.2 scheduler.ts — Multi-dependency check
+
+```typescript
+// CURRENT (lines 437-454):
+if (task.dependsOn) {
+  const dep = this.tasks.get(task.dependsOn) ?? this.store.get(task.dependsOn);
+  // ... single check
+
+// NEW:
+const deps = task.dependsOn
+  ? (Array.isArray(task.dependsOn) ? task.dependsOn : [task.dependsOn])
+  : [];
+
+if (deps.length > 0) {
+  let allSuccess = true;
+  let anyTerminalFail = false;
+  let failedDepId = "";
+
+  for (const depId of deps) {
+    const dep = this.tasks.get(depId) ?? this.store.get(depId) ?? undefined;
+    if (!dep || dep.status === "failed" || dep.status === "timeout" || dep.status === "cancelled") {
+      anyTerminalFail = true;
+      failedDepId = depId;
+      break;
+    }
+    if (dep.status !== "success") {
+      allSuccess = false;
+    }
+  }
+
+  if (anyTerminalFail) {
+    task.status = "failed";
+    task.error = `dependency ${failedDepId} is ${...}`;
+    // ... same terminal handling
+    continue;
+  }
+  if (!allSuccess) {
+    this.queue.push(task);
+    await this.waitForDispatch(1_000);
+    continue;
+  }
+}
+```
+
+#### 1.3.3 store.ts — Serialize array
+
+The store already serializes `depends_on` as a string column. For backward compat:
+- Write: `JSON.stringify(task.dependsOn)` if array, else store as string
+- Read: `JSON.parse()` if starts with `[`, else treat as single string
+
+**Tests to add:**
+- Single dependency still works (backward compat)
+- Multi-dependency: all success → dispatch
+- Multi-dependency: one failed → fail task
+- Multi-dependency: one pending → re-queue
+- Store serialization round-trip for arrays
+
+**LOC: ~40**
+
+---
+
+## Phase 2: Intelligence Layer (Day 3-5)
+
+Goal: Smart routing + static analysis for wave planning.
+
+### 2.1 Task Classifier + Model Router
+
+**Problem:** `agent-runner.ts:59` hardcodes `claude-sonnet-4-6` for all tasks.
+Simple renames waste expensive model time; complex refactors fail with weak models.
+
+**Files to add:**
+- `src/task-classifier.ts` (NEW)
+
+**Files to modify:**
+- `src/agent-runner.ts` (use classifier result)
+- `src/types.ts` (add `complexity` field)
+
+**Changes:**
+
+#### 2.1.1 task-classifier.ts (NEW)
+
+```typescript
+export type TaskComplexity = "quick" | "normal" | "deep";
+
+interface ClassifyResult {
+  complexity: TaskComplexity;
+  model: string;
+  reason: string;
+}
+
+// Cost per task (approximate):
+// quick (Haiku):  $0.001
+// normal (Sonnet): $0.10
+// deep (Opus):     $1.00
+
+const QUICK_PATTERNS = [
+  /\brename\b/i, /\btypo\b/i, /\bcomment\b/i, /\bformat\b/i,
+  /\bdelete\b.*\bunused\b/i, /\bremove\b.*\bimport\b/i,
+  /\badd\b.*\bfield\b/i, /\bupdate\b.*\bversion\b/i,
+];
+
+const DEEP_PATTERNS = [
+  /\brefactor\b/i, /\bredesign\b/i, /\barchitect\b/i, /\bmigrat\b/i,
+  /\boptimiz\b/i, /\bsecurity\b/i, /\bperformance\b/i,
+  /\bfrom scratch\b/i, /\bentire\b/i, /\ball files\b/i,
+];
+
+export function classifyTask(prompt: string): ClassifyResult {
+  // Rule 1: Short prompts + quick patterns → quick
+  if (prompt.length < 200 && QUICK_PATTERNS.some(p => p.test(prompt))) {
+    return { complexity: "quick", model: "claude-haiku-4-5-20251001", reason: "short prompt + simple pattern" };
+  }
+
+  // Rule 2: Deep patterns → deep
+  if (DEEP_PATTERNS.some(p => p.test(prompt))) {
+    return { complexity: "deep", model: "claude-opus-4-6", reason: "complex pattern detected" };
+  }
+
+  // Rule 3: Multi-file mention (3+ files) → deep
+  const fileRefs = prompt.match(/\b[\w./\\-]+\.(?:ts|js|tsx|jsx|py)\b/gi) ?? [];
+  const uniqueFiles = new Set(fileRefs);
+  if (uniqueFiles.size >= 4) {
+    return { complexity: "deep", model: "claude-opus-4-6", reason: `${uniqueFiles.size} files referenced` };
+  }
+
+  // Rule 4: Long prompt with error context → normal (retry scenario)
+  // Rule 5: Default → normal
+  return { complexity: "normal", model: "claude-sonnet-4-6", reason: "default" };
+}
+
+// Model cost rates for estimation
+export const MODEL_RATES: Record<string, { input: number; output: number }> = {
+  "claude-haiku-4-5-20251001": { input: 0.8 / 1_000_000, output: 4 / 1_000_000 },
+  "claude-sonnet-4-6": { input: 3 / 1_000_000, output: 15 / 1_000_000 },
+  "claude-opus-4-6": { input: 15 / 1_000_000, output: 75 / 1_000_000 },
+};
+```
+
+#### 2.1.2 agent-runner.ts modifications
+
+```typescript
+import { classifyTask, MODEL_RATES } from "./task-classifier.js";
+
+// In run(), determine model:
+const classification = classifyTask(task.prompt);
+const model = task.modelOverride ?? classification.model ?? this.model;
+
+// Update estimateCost to use MODEL_RATES:
+static estimateCost(tokenInput: number, tokenOutput: number, model: string): number {
+  const r = MODEL_RATES[model] ?? MODEL_RATES["claude-sonnet-4-6"];
+  return tokenInput * r.input + tokenOutput * r.output;
+}
+```
+
+#### 2.1.3 types.ts
+
+```typescript
+// Add to Task interface:
+complexity?: "quick" | "normal" | "deep";
+```
+
+**Tests to add:**
+- "Rename foo to bar" → quick → Haiku
+- "Refactor the entire authentication module" → deep → Opus
+- Short prompt with no patterns → normal → Sonnet
+- 4+ file references → deep
+- modelOverride takes precedence over classifier
+- Cost estimation uses correct rates per model
+
+**LOC: ~70**
+
+---
+
+### 2.2 Import Graph for Wave Validation
+
+**Problem:** `pipeline.ts:292-348` decompose stage relies entirely on LLM to plan waves.
+LLM can misjudge file dependencies, putting types.ts consumer in wave 0 alongside types.ts.
+
+**Files to add:**
+- `src/import-graph.ts` (NEW)
+
+**Files to modify:**
+- `src/pipeline.ts` (validate/reorder waves after LLM decompose)
+
+**Changes:**
+
+#### 2.2.1 import-graph.ts (NEW)
+
+```typescript
+import { readFileSync, readdirSync, statSync } from "fs";
+import { join, relative, dirname } from "path";
+
+interface FileNode {
+  path: string;           // relative path from repo root
+  imports: string[];      // relative paths of files this imports
+  importedBy: string[];   // reverse: files that import this
+}
+
+/**
+ * Build a dependency graph from TypeScript/JavaScript imports.
+ * Uses regex (not tree-sitter) for zero dependencies.
+ */
+export function buildImportGraph(repoPath: string, srcDir = "src"): Map<string, FileNode> {
+  const graph = new Map<string, FileNode>();
+  const fullSrcDir = join(repoPath, srcDir);
+
+  // Collect all TS/JS files
+  const files = collectFiles(fullSrcDir, /\.(ts|tsx|js|jsx|mts|mjs)$/);
+
+  for (const absPath of files) {
+    const relPath = relative(repoPath, absPath);
+    const content = readFileSync(absPath, "utf-8");
+    const imports = extractImports(content, dirname(absPath), repoPath);
+
+    graph.set(relPath, { path: relPath, imports, importedBy: [] });
+  }
+
+  // Build reverse edges
+  for (const [path, node] of graph) {
+    for (const imp of node.imports) {
+      const target = graph.get(imp);
+      if (target) target.importedBy.push(path);
+    }
+  }
+
+  return graph;
+}
+
+/**
+ * Given a set of files to be modified, return the topological order.
+ * Files with no dependencies come first.
+ * Returns array of arrays (waves).
+ */
+export function topologicalWaves(
+  graph: Map<string, FileNode>,
+  filesToModify: string[],
+): string[][] {
+  const subset = new Set(filesToModify);
+  const inDegree = new Map<string, number>();
+  const edges = new Map<string, string[]>(); // file → files that depend on it
+
+  for (const file of subset) {
+    const node = graph.get(file);
+    if (!node) { inDegree.set(file, 0); continue; }
+
+    // Count only dependencies within the subset
+    const depsInSubset = node.imports.filter(i => subset.has(i));
+    inDegree.set(file, depsInSubset.length);
+
+    for (const dep of depsInSubset) {
+      const list = edges.get(dep) ?? [];
+      list.push(file);
+      edges.set(dep, list);
+    }
+  }
+
+  // Kahn's algorithm
+  const waves: string[][] = [];
+  const remaining = new Set(subset);
+
+  while (remaining.size > 0) {
+    const wave = [...remaining].filter(f => (inDegree.get(f) ?? 0) === 0);
+    if (wave.length === 0) {
+      // Cycle detected — put all remaining in one wave
+      waves.push([...remaining]);
+      break;
+    }
+    waves.push(wave);
+    for (const f of wave) {
+      remaining.delete(f);
+      for (const dependent of (edges.get(f) ?? [])) {
+        inDegree.set(dependent, (inDegree.get(dependent) ?? 1) - 1);
+      }
+    }
+  }
+
+  return waves;
+}
+
+function extractImports(content: string, fileDir: string, repoRoot: string): string[] {
+  const imports: string[] = [];
+  // Match: import ... from "./foo.js"  or  import ... from "../bar.js"
+  const importRegex = /(?:import|export)\s+.*?from\s+["'](\.[^"']+)["']/g;
+  let match: RegExpExecArray | null;
+  while ((match = importRegex.exec(content)) !== null) {
+    const specifier = match[1];
+    // Resolve to actual file path
+    const resolved = resolveImport(specifier, fileDir, repoRoot);
+    if (resolved) imports.push(resolved);
+  }
+  return imports;
+}
+
+function resolveImport(specifier: string, fromDir: string, repoRoot: string): string | null {
+  const abs = join(fromDir, specifier);
+  // Try exact, .ts, /index.ts
+  for (const ext of ["", ".ts", ".tsx", ".js", "/index.ts"]) {
+    const candidate = abs.replace(/\.js$/, ".ts") + ext;
+    try {
+      statSync(candidate);
+      return relative(repoRoot, candidate);
+    } catch { continue; }
+  }
+  // .js → .ts resolution
+  const tsPath = abs.replace(/\.js$/, ".ts");
+  try { statSync(tsPath); return relative(repoRoot, tsPath); } catch { /* */ }
+  return null;
+}
+
+function collectFiles(dir: string, pattern: RegExp): string[] {
+  const results: string[] = [];
+  for (const entry of readdirSync(dir, { withFileTypes: true })) {
+    const full = join(dir, entry.name);
+    if (entry.isDirectory() && !entry.name.startsWith(".") && entry.name !== "node_modules") {
+      results.push(...collectFiles(full, pattern));
+    } else if (entry.isFile() && pattern.test(entry.name)) {
+      results.push(full);
+    }
+  }
+  return results;
+}
+```
+
+#### 2.2.2 pipeline.ts — Validate waves after decompose
+
+```typescript
+import { buildImportGraph, topologicalWaves } from "./import-graph.js";
+
+// In doDecompose(), after LLM returns waves and before saving:
+private validateWaveOrder(
+  decomposed: DecomposeOutput,
+  repoPath: string,
+): DecomposeOutput {
+  const graph = buildImportGraph(repoPath);
+
+  // Extract file mentions from each task prompt
+  for (const wave of decomposed.waves) {
+    for (let i = 0; i < wave.tasks.length; i++) {
+      const taskPrompt = wave.tasks[i];
+      const files = (taskPrompt.match(/\b(src\/[\w./\\-]+\.(?:ts|js))\b/gi) ?? []);
+      // Check if any referenced file depends on a file in a LATER wave
+      // If so, log a warning (future: reorder)
+    }
+  }
+
+  return decomposed; // Phase 1: validate only. Phase 2: auto-reorder.
+}
+```
+
+**Tests to add:**
+- buildImportGraph() parses simple TS imports
+- topologicalWaves() returns correct order for linear chain
+- topologicalWaves() handles cycle gracefully
+- topologicalWaves() puts files with no deps in wave 0
+- validateWaveOrder() detects misordered waves
+
+**LOC: ~150**
+
+---
+
+### 2.3 Failure Pattern Injection
+
+**Problem:** `store.ts:449` has `getFailurePatterns()` that returns recent errors,
+but nothing reads it. Agents repeat the same mistakes.
+
+**Files to modify:**
+- `src/agent-runner.ts` (line 235-280, buildSystemPrompt)
+- `src/scheduler.ts` (pass store reference to runner)
+
+**Changes:**
+
+#### 2.3.1 agent-runner.ts — Inject patterns into system prompt
+
+```typescript
+// Add parameter to buildSystemPrompt:
+buildSystemPrompt(task: Task, cwd: string, failurePatterns?: { prompt: string; error: string }[]): string {
+  const parts: string[] = [];
+  // ... existing code ...
+
+  // NEW: Inject failure patterns
+  if (failurePatterns && failurePatterns.length > 0) {
+    parts.push("\n## Known Issues to Avoid");
+    for (const p of failurePatterns.slice(0, 3)) {
+      // Only inject if the pattern is relevant (similar prompt)
+      const similarity = jaccardSimilarity(task.prompt, p.prompt);
+      if (similarity > 0.2) {
+        const shortError = p.error.length > 150 ? p.error.slice(0, 150) + "..." : p.error;
+        parts.push(`- Previous similar task failed: ${shortError}`);
+      }
+    }
+  }
+
+  return parts.join("\n");
+}
+
+// Simple Jaccard similarity on word sets
+function jaccardSimilarity(a: string, b: string): number {
+  const setA = new Set(a.toLowerCase().split(/\s+/));
+  const setB = new Set(b.toLowerCase().split(/\s+/));
+  const intersection = [...setA].filter(x => setB.has(x)).length;
+  const union = new Set([...setA, ...setB]).size;
+  return union > 0 ? intersection / union : 0;
+}
+```
+
+#### 2.3.2 scheduler.ts — Pass patterns to runner
+
+```typescript
+// In executeAndRelease(), before runner.run():
+const patterns = this.store.getFailurePatterns(5);
+// Pass to buildSystemPrompt via runner configuration
+```
+
+**Tests to add:**
+- Failure patterns injected when similarity > 0.2
+- Irrelevant patterns not injected (similarity < 0.2)
+- Jaccard similarity function correctness
+- Empty patterns → no injection
+
+**LOC: ~30**
+
+---
+
+## Phase 3: Safety & Efficiency (Day 6-7)
+
+Goal: Prevent waste, catch more issues before merge.
+
+### 3.1 Enhanced Verification Gate
+
+**Problem:** Only TSC check exists in agent-runner.ts:338-346. No lint check, no
+scope verification (agent can modify files outside its mandate).
+
+**Files to modify:**
+- `src/agent-runner.ts` (extend verifyBuild)
+
+**Changes:**
+
+```typescript
+// In verifyBuild() or as a new method verifyTask():
+async verifyTask(task: Task, cwd: string): Promise<{ pass: boolean; issues: string[] }> {
+  const issues: string[] = [];
+
+  // 1. TSC check (existing)
+  try {
+    await execAsync("npx tsc --noEmit", { cwd });
+  } catch (err: any) {
+    issues.push(`TSC: ${err.stdout?.slice(0, 300) ?? err.message}`);
+  }
+
+  // 2. Scope check: verify agent didn't modify unexpected files
+  try {
+    const { stdout } = await execAsync("git diff --name-only HEAD~1", { cwd });
+    const modifiedFiles = stdout.trim().split("\n").filter(Boolean);
+    if (modifiedFiles.length > 5) {
+      issues.push(`Scope: modified ${modifiedFiles.length} files (expected <=5)`);
+    }
+  } catch { /* no commits yet */ }
+
+  // 3. Lint check (if eslint configured)
+  if (existsSync(join(cwd, ".eslintrc.json")) || existsSync(join(cwd, "eslint.config.js"))) {
+    try {
+      await execAsync("npx eslint --quiet --no-color src/", { cwd, timeout: 30_000 });
+    } catch (err: any) {
+      issues.push(`Lint: ${err.stdout?.slice(0, 200) ?? "lint errors"}`);
+    }
+  }
+
+  return { pass: issues.length === 0, issues };
+}
+```
+
+**Tests to add:**
+- TSC failure detected
+- Scope violation detected (>5 files)
+- Lint errors detected
+- All pass → { pass: true, issues: [] }
+
+**LOC: ~35**
+
+---
+
+### 3.2 Smart Dead-Loop Detection
+
+**Problem:** `pipeline.ts:459-462` only compares exact error strings. Doesn't detect:
+- Oscillating errors (A→B→A→B)
+- Token count inflation (agent adding more context each loop)
+- Budget-aware stopping
+
+**Files to modify:**
+- `src/pipeline.ts` (lines 458-491)
+
+**Changes:**
+
+```typescript
+// Replace simple sameErrors check with:
+private isStuckLoop(run: PipelineRun): { stuck: boolean; reason: string } {
+  const results = run.verifyResults ?? [];
+  if (results.length < 2) return { stuck: false, reason: "" };
+
+  const current = results[results.length - 1];
+  const prev = results[results.length - 2];
+
+  // Check 1: Exact same errors (existing)
+  if (JSON.stringify(prev.errors) === JSON.stringify(current.errors)) {
+    return { stuck: true, reason: "identical errors repeated" };
+  }
+
+  // Check 2: Oscillation (A→B→A pattern)
+  if (results.length >= 3) {
+    const prevPrev = results[results.length - 3];
+    if (JSON.stringify(prevPrev.errors) === JSON.stringify(current.errors)) {
+      return { stuck: true, reason: "oscillating errors (A→B→A)" };
+    }
+  }
+
+  // Check 3: Error count not decreasing over 3 iterations
+  if (results.length >= 3) {
+    const counts = results.slice(-3).map(r => r.errors.length);
+    if (counts[2] >= counts[0] && counts[1] >= counts[0]) {
+      return { stuck: true, reason: `error count not decreasing: ${counts.join(" → ")}` };
+    }
+  }
+
+  return { stuck: false, reason: "" };
+}
+```
+
+**Tests to add:**
+- Exact duplicate errors → stuck
+- Oscillating A→B→A → stuck
+- Error count increasing → stuck
+- Error count decreasing → not stuck
+- Less than 2 results → not stuck
+
+**LOC: ~30**
+
+---
+
+### 3.3 Budget-Aware Model Downgrade
+
+**Problem:** When pipeline budget is running low, tasks still use the originally
+assigned model. Should auto-downgrade to cheaper models to complete more tasks.
+
+**Files to modify:**
+- `src/pipeline.ts` (in doExecute, before submitting tasks)
+
+**Changes:**
+
+```typescript
+// In doExecute(), before submitting each wave task:
+private selectModelForBudget(
+  run: PipelineRun,
+  defaultModel: string,
+): string {
+  const cfg = this.cfg(run.id);
+  if (cfg.totalBudget <= 0) return defaultModel;
+
+  let spent = 0;
+  for (const taskId of run.taskIds) {
+    const t = this.scheduler.getTask(taskId);
+    if (t?.costUsd) spent += t.costUsd;
+  }
+
+  const remaining = cfg.totalBudget - spent;
+  const remainingRatio = remaining / cfg.totalBudget;
+
+  // Below 20% budget → downgrade to Sonnet
+  if (remainingRatio < 0.2 && defaultModel === "claude-opus-4-6") {
+    log("info", "budget low, downgrading to Sonnet", { remaining, ratio: remainingRatio });
+    return "claude-sonnet-4-6";
+  }
+
+  // Below 10% budget → downgrade to Haiku
+  if (remainingRatio < 0.1) {
+    log("info", "budget critical, downgrading to Haiku", { remaining, ratio: remainingRatio });
+    return "claude-haiku-4-5-20251001";
+  }
+
+  return defaultModel;
+}
+```
+
+**Tests to add:**
+- >20% budget → no downgrade
+- 10-20% budget → Opus downgrades to Sonnet
+- <10% budget → all downgrade to Haiku
+- Budget of 0 (unlimited) → no downgrade
+
+**LOC: ~25**
+
+---
+
+## Summary Table
+
+| # | Feature | Phase | File(s) | LOC | Success Rate Impact | Cost Impact |
+|---|---------|-------|---------|-----|--------------------|----|
+| 1.1 | Error context fix + model escalation | 1 | scheduler, agent-runner, types | 25 | +15-25% | +5% (Opus retries) |
+| 1.2 | Staged merge + rebase | 1 | worktree-pool, scheduler | 50 | +40-60% | 0 |
+| 1.3 | Dependency DAG (string[]) | 1 | types, scheduler, store | 40 | +10% | 0 |
+| 2.1 | Task classifier + model router | 2 | NEW task-classifier, agent-runner | 70 | +10% | -50% to -70% |
+| 2.2 | Import graph wave validation | 2 | NEW import-graph, pipeline | 150 | +20% | -10% |
+| 2.3 | Failure pattern injection | 2 | agent-runner, scheduler | 30 | +5-10% | 0 |
+| 3.1 | Enhanced verification gate | 3 | agent-runner | 35 | +5-10% | 0 |
+| 3.2 | Smart dead-loop detection | 3 | pipeline | 30 | 0 (defensive) | -$50-100/incident |
+| 3.3 | Budget-aware model downgrade | 3 | pipeline | 25 | 0 | -20% |
+| | **TOTAL** | | **4 new + 6 modified** | **~455** | **0% → 90%+** | **-50%** |
+
+---
+
+## Test Plan
+
+Each feature must have tests BEFORE implementation (TDD):
+
+### Phase 1 Tests (~15 tests)
+- `scheduler.test.ts`: retry error preservation, prompt accumulation prevention,
+  model escalation, multi-dependency dispatch
+- `worktree-pool.test.ts`: rebaseOnMain success/conflict/abort, getActiveWorkers
+- Integration: merge → rebase → next task sees new types
+
+### Phase 2 Tests (~20 tests)
+- `task-classifier.test.ts` (NEW): pattern matching, file counting, model selection
+- `import-graph.test.ts` (NEW): graph building, topological sort, cycle handling
+- `agent-runner.test.ts`: failure pattern injection, similarity filtering
+
+### Phase 3 Tests (~10 tests)
+- `agent-runner.test.ts`: scope check, lint check
+- `pipeline.test.ts`: oscillation detection, error count monitoring, budget downgrade
+
+---
+
+## Migration Notes
+
+- `dependsOn: string` → `string | string[]` is backward compatible
+  (existing single-string values still work)
+- `modelOverride` and `_originalPrompt` are optional fields — no DB migration needed
+- `task-classifier.ts` and `import-graph.ts` are new files — no conflicts
+- All changes are additive — existing tests must continue to pass
+
+---
+
+## Evidence Base
+
+| Feature | Evidence Source | Data Point |
+|---------|---------------|------------|
+| Error context fix | cc-manager scheduler.ts:549 | Bug: `task.error = ""` clears context |
+| Model escalation | RouteLLM (ICLR 2025) | 85% cost reduction, 95% quality retention |
+| Staged merge | Graphite production data | 1.5-2.5x merge speed improvement |
+| Rebase pattern | Gas Town (Refinery) | Bors-style merge queue |
+| Import graph | Aider repo-map | 40% → 85% multi-file success rate |
+| Task classifier | oh-my-opencode categories | quick/deep/visual/ultrabrain routing |
+| Failure injection | SWE-Exp (2025) | Structured experience → guided repair |
+| Dual verification | Spotify Honk | 650+ PR/month, LLM judge rejects 25% |
+| Dead-loop detect | OpenClaw issue #16808 | Sliding window detection |
+| Budget downgrade | Perplexity Computer | Per-token billing with spending caps |
diff --git a/docs/research/2026-03-05-agent-landscape.md b/docs/research/2026-03-05-agent-landscape.md
new file mode 100644
index 0000000..54bf56e
--- /dev/null
+++ b/docs/research/2026-03-05-agent-landscape.md
@@ -0,0 +1,71 @@
+# Agent Landscape Research (2026-03-05)
+
+## Perplexity Computer
+- 19-model orchestrator, meta-router picks best model per subtask
+- $200/month Max plan, Claude Opus 4.6 as core reasoning engine
+- Cloud sandbox isolation, persistent memory across sessions
+- "Wide but shallow" — good at general tasks, less reliable for complex UI/multi-file/production code
+- cc-manager positioning: "narrow but deep" — specialized for code with git-native verification
+
+## GPT-5.4 (Released 2026-03-05)
+- Pricing: $2.50/$15.00 per M tokens (standard 272K context)
+- 1M context: experimental, opt-in via Codex config.toml, 2x/1.5x cost penalty
+- SWE-bench: 77.2% (vs Opus 4.6 80.9%, Sonnet 4.6 ~65%)
+- OSWorld: 75.0%, native computer use
+- Variants: GPT-5.4 Thinking, GPT-5.4 Pro
+- Key for cc-manager: cost-effective alternative to Opus for cross-model retry
+
+## Claude Code CLI (2.1.x)
+- New flags since cc-manager was built:
+  - `--max-budget-usd` — built-in budget (we already use this)
+  - `--json-schema` — guaranteed structured output
+  - `--fallback-model` — auto-downgrade on overload
+  - `--resume` — session recovery for retries
+  - `--max-turns` — loop prevention
+  - `--agents` — dynamic subagent definitions
+  - `--worktree` — built-in worktree support
+
+## Claude Agent SDK (v0.2.69)
+- V2 preview: `send()`/`stream()` replaces V1 `query()` async generator
+- `createSession()`/`resumeSession()` — persistent sessions
+- 18 lifecycle hooks: PreToolUse, PostToolUse, Stop, WorktreeCreate, etc.
+- Subagent definitions, MCP server integration, structured outputs
+- cc-manager still on V1 `query()` — major upgrade needed
+
+## Codex CLI (0.104.0)
+- GPT-5.4 support with profile-based configuration
+- `model_reasoning_effort`: low/medium/high/xhigh
+- Agent roles: worker/explorer/reviewer/monitor
+- Config via `~/.codex/config.toml` with profiles
+- cc-manager hardcodes o4-mini — needs routing update
+
+## Model Comparison Table
+| Model | Input $/M | Output $/M | SWE-bench | Context |
+|-------|----------|-----------|-----------|---------|
+| claude-haiku-4-5 | 0.80 | 4.00 | ~40% | 200K |
+| claude-sonnet-4-6 | 3.00 | 15.00 | ~65% | 200K |
+| claude-opus-4-6 | 15.00 | 75.00 | 80.9% | 200K |
+| gpt-5.4 | 2.50 | 15.00 | 77.2% | 272K (1.05M opt-in) |
+| gpt-5.4 (1M mode) | 5.00 | 22.50 | 77.2% | 1.05M |
+| o4-mini | 1.10 | 4.40 | ~55% | 200K |
+
+## Key Insight: Cross-Model Retry
+Different models have different training biases. When Claude fails on a task,
+GPT-5.4 may succeed (and vice versa) — not because one is "better" but because
+they approach problems differently. This is why cc-manager's `pickFallbackAgent()`
+(claude ↔ codex swap on retry) is architecturally correct, just needs better
+model selection within each agent.
+
+## NeurIPS 2025 Finding
+79% of multi-agent failures are specification/coordination issues, not technical.
+This validates cc-manager's focus on wave planning and staged merging over
+raw model capability.
+
+## Sources
+- Perplexity Computer: perplexity.ai/computer
+- GPT-5.4: openai.com/index/introducing-gpt-5-4/
+- Claude SDK: npmjs.com/package/@anthropic-ai/claude-agent-sdk
+- Codex config: developers.openai.com/codex/config-reference
+- RouteLLM (ICLR 2025): 85% cost reduction, 95% quality retention
+- Aider repo-map: tree-sitter + PageRank → 40%→85% multi-file success
+- Spotify Honk: 650+ PR/month, dual verification
diff --git a/package.json b/package.json
index 609f1cf..221aea6 100644
--- a/package.json
+++ b/package.json
@@ -1,6 +1,6 @@
 {
   "name": "cc-manager",
-  "version": "0.1.0",
+  "version": "0.1.7",
   "description": "Multi-agent orchestrator for Claude Code",
   "type": "module",
   "bin": {
diff --git a/src/__tests__/agent-runner.test.ts b/src/__tests__/agent-runner.test.ts
index f0d7f48..464a23c 100644
--- a/src/__tests__/agent-runner.test.ts
+++ b/src/__tests__/agent-runner.test.ts
@@ -2,9 +2,10 @@ import { describe, it, before, after } from "node:test";
 import assert from "node:assert/strict";
 import { AgentRunner, type ReviewResult } from "../agent-runner.js";
 import { createTask } from "../types.js";
-import { mkdtempSync, writeFileSync, mkdirSync, rmSync } from "node:fs";
+import { mkdtempSync, writeFileSync, readFileSync, mkdirSync, rmSync } from "node:fs";
 import { join } from "node:path";
 import { tmpdir } from "node:os";
+import { execFileSync } from "node:child_process";
 
 describe("AgentRunner", () => {
   // Temp directories for language detection tests
@@ -40,7 +41,7 @@ describe("AgentRunner", () => {
   });
 
   it("estimateCost returns correct values for opus model", () => {
-    const cost = AgentRunner.estimateCost(1_000_000, 1_000_000, "claude-opus-4-5");
+    const cost = AgentRunner.estimateCost(1_000_000, 1_000_000, "claude-opus-4-6");
     assert.strictEqual(cost, 90); // 15 + 75
   });
 
@@ -141,7 +142,7 @@ describe("AgentRunner", () => {
   });
 
   it("constructor accepts custom parameters", () => {
-    const runner = new AgentRunner("claude-opus-4-5", "be concise", "codex");
+    const runner = new AgentRunner("claude-opus-4-6", "be concise", "codex");
     assert.deepStrictEqual(runner.getRunningTasks(), []);
   });
 
@@ -409,6 +410,116 @@ describe("AgentRunner", () => {
     assert.strictEqual(parse('{"approve": true, "issues": []}'), null); // missing score
   });
 
+  // ── F2: buildTaskPrompt enforces commit ──
+
+  it("buildTaskPrompt includes CRITICAL commit enforcement", () => {
+    const runner = new AgentRunner();
+    const task = createTask("fix a bug in src/server.ts");
+    const prompt = (runner as unknown as { buildTaskPrompt: (t: typeof task, cwd: string) => string }).buildTaskPrompt(task, "/tmp");
+    assert.ok(prompt.includes("CRITICAL"), "prompt should contain CRITICAL commit warning");
+    assert.ok(prompt.includes("MUST run"), "prompt should enforce git commit");
+  });
+
+  it("buildTaskPrompt returns the raw prompt for meta tasks", () => {
+    const runner = new AgentRunner();
+    const task = createTask("plan the work only", { meta: true });
+    const prompt = (runner as unknown as { buildTaskPrompt: (t: typeof task, cwd: string) => string }).buildTaskPrompt(task, tsDir);
+    assert.strictEqual(prompt, "plan the work only");
+  });
+
+  it("buildSystemPrompt omits coding-task instructions for meta tasks", () => {
+    const runner = new AgentRunner();
+    const task = createTask("research the repository", { meta: true });
+    const prompt = runner.buildSystemPrompt(task, tsDir);
+    assert.strictEqual(prompt, "");
+  });
+
+  it("run() lets a meta task succeed without commits or build verification", async () => {
+    const runner = new AgentRunner();
+    const repoDir = mkdtempSync(join(tmpdir(), "meta-runner-repo-"));
+    try {
+      execFileSync("git", ["init", "-b", "main"], { cwd: repoDir });
+      execFileSync("git", ["config", "user.email", "test@example.com"], { cwd: repoDir });
+      execFileSync("git", ["config", "user.name", "Test"], { cwd: repoDir });
+      writeFileSync(join(repoDir, "tsconfig.json"), JSON.stringify({ include: ["src/**/*.ts"] }));
+      execFileSync("git", ["add", "."], { cwd: repoDir });
+      execFileSync("git", ["commit", "-m", "init"], { cwd: repoDir });
+
+      const task = createTask("research the repository", { agent: "echo", timeout: 5, meta: true });
+      await runner.run(task, repoDir);
+
+      assert.strictEqual(task.status, "success");
+      assert.ok(task.output.includes("research the repository"));
+    } finally {
+      rmSync(repoDir, { recursive: true, force: true });
+    }
+  });
+
+  // ── F4: Complete pricing table ──
+
+  it("estimateCost returns correct values for haiku", () => {
+    const cost = AgentRunner.estimateCost(1_000_000, 1_000_000, "claude-haiku-4-5-20251001");
+    assert.strictEqual(cost, 4.8); // 0.80 + 4.00
+  });
+
+  it("estimateCost returns correct values for gpt-5.4", () => {
+    const cost = AgentRunner.estimateCost(1_000_000, 1_000_000, "gpt-5.4");
+    assert.strictEqual(cost, 17.5); // 2.50 + 15.00
+  });
+
+  it("estimateCost returns correct values for o4-mini", () => {
+    const cost = AgentRunner.estimateCost(1_000_000, 1_000_000, "o4-mini");
+    assert.strictEqual(cost, 5.5); // 1.10 + 4.40
+  });
+
+  it("estimateCost returns correct values for gpt-5.4-wide", () => {
+    const cost = AgentRunner.estimateCost(1_000_000, 1_000_000, "gpt-5.4-wide");
+    assert.strictEqual(cost, 27.5); // 5.00 + 22.50
+  });
+
+  // ── F5: sessionId capture ──
+
+  it("handleClaudeEvent captures sessionId from system message", () => {
+    const runner = new AgentRunner();
+    const task = createTask("test");
+    task.status = "running";
+    const handler = (runner as unknown as { handleClaudeEvent: Function }).handleClaudeEvent.bind(runner);
+    handler({ type: "system", session_id: "sess_abc123" }, task, Date.now());
+    assert.strictEqual(task.sessionId, "sess_abc123");
+  });
+
+  it("handleClaudeEvent captures sessionId from result if not set", () => {
+    const runner = new AgentRunner();
+    const task = createTask("test");
+    task.status = "running";
+    const handler = (runner as unknown as { handleClaudeEvent: Function }).handleClaudeEvent.bind(runner);
+    handler({
+      type: "result", subtype: "success", result: "done",
+      session_id: "sess_def456",
+      total_cost_usd: 0.1, usage: { input_tokens: 100, output_tokens: 50 },
+    }, task, Date.now());
+    assert.strictEqual(task.sessionId, "sess_def456");
+  });
+
+  // ── F9: Codex config.toml ──
+
+  it("ensureCodexConfig creates config with default + wide profiles", () => {
+    const origHome = process.env.HOME;
+    const tmpHome = mkdtempSync(join(tmpdir(), "test-codex-config-"));
+    process.env.HOME = tmpHome;
+    try {
+      AgentRunner.ensureCodexConfig();
+      const content = readFileSync(join(tmpHome, ".codex", "config.toml"), "utf8");
+      assert.ok(content.includes("[profiles.default]"), "should have default profile");
+      assert.ok(content.includes("[profiles.wide]"), "should have wide profile");
+      assert.ok(content.includes("gpt-5.4"), "should use gpt-5.4");
+      assert.ok(content.includes("1050000"), "wide profile should have 1M context");
+    } finally {
+      process.env.HOME = origHome;
+      rmSync(tmpHome, { recursive: true, force: true });
+    }
+  });
+
   // ── reviewDiff approve field ──
 
   it("reviewDiff includes approve field based on score threshold", () => {
diff --git a/src/__tests__/pipeline.test.ts b/src/__tests__/pipeline.test.ts
new file mode 100644
index 0000000..fc87718
--- /dev/null
+++ b/src/__tests__/pipeline.test.ts
@@ -0,0 +1,1325 @@
+import { describe, it } from "node:test";
+import assert from "node:assert/strict";
+import Database from "better-sqlite3";
+import fs from "node:fs";
+import os from "node:os";
+import path from "node:path";
+import { Pipeline, extractFilePaths, validateWaves } from "../pipeline.js";
+import { PipelineStore } from "../pipeline-store.js";
+import { createTask } from "../types.js";
+import type { Task } from "../types.js";
+import type { AgentRunner } from "../agent-runner.js";
+import type { Scheduler } from "../scheduler.js";
+import type { PipelineConfig, PipelineRun } from "../pipeline-types.js";
+import { defaultPipelineConfig } from "../pipeline-types.js";
+
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
+
+function makeTempDb(): { db: Database.Database; cleanup: () => void } {
+  const dir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-test-"));
+  const db = new Database(path.join(dir, "test.db"));
+  db.pragma("journal_mode = WAL");
+  return {
+    db,
+    cleanup: () => {
+      db.close();
+      fs.rmSync(dir, { recursive: true, force: true });
+    },
+  };
+}
+
+function makeConfig(overrides: Partial<PipelineConfig> = {}): PipelineConfig {
+  return { ...defaultPipelineConfig, autoApprove: true, ...overrides };
+}
+
+function makeRunner(handler?: (task: Task, cwd: string) => Task): AgentRunner {
+  return {
+    run: async (task: Task, cwd: string, _cb?: unknown) => {
+      if (handler) return handler(task, cwd);
+      task.status = "success";
+      task.output = "done";
+      return task;
+    },
+    getRunningTasks: () => [],
+    reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+  } as unknown as AgentRunner;
+}
+
+function makeScheduler(opts?: {
+  submitHandler?: (prompt: string) => Task;
+  getTaskHandler?: (id: string) => Task | undefined;
+  cancelHandler?: (id: string) => boolean;
+  abortHandler?: (id: string) => boolean;
+}): Scheduler {
+  const tasks = new Map<string, Task>();
+  return {
+    submit: (prompt: string, submitOpts?: Record<string, unknown>) => {
+      if (opts?.submitHandler) return opts.submitHandler(prompt);
+      const t = createTask(prompt, { tags: submitOpts?.tags as string[] });
+      t.status = "success";
+      tasks.set(t.id, t);
+      return t;
+    },
+    getTask: (id: string) => {
+      if (opts?.getTaskHandler) return opts.getTaskHandler(id);
+      return tasks.get(id);
+    },
+    cancel: (id: string) => {
+      if (opts?.cancelHandler) return opts.cancelHandler(id);
+      return true;
+    },
+    abort: (id: string) => {
+      if (opts?.abortHandler) return opts.abortHandler(id);
+      return false;
+    },
+  } as unknown as Scheduler;
+}
+
+// ---------------------------------------------------------------------------
+// PipelineStore tests
+// ---------------------------------------------------------------------------
+
+describe("PipelineStore", () => {
+  it("save and get a PipelineRun", () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const now = new Date().toISOString();
+      const run: PipelineRun = {
+        id: "run-001",
+        goal: "add auth",
+        stage: "research_plan",
+        mode: "augment",
+        iteration: 0,
+        maxIterations: 3,
+        waves: [],
+        taskIds: [],
+        createdAt: now,
+        updatedAt: now,
+      };
+      store.save(run);
+      const got = store.get("run-001");
+      assert.ok(got !== null);
+      assert.strictEqual(got.id, "run-001");
+      assert.strictEqual(got.goal, "add auth");
+      assert.strictEqual(got.stage, "research_plan");
+      assert.strictEqual(got.mode, "augment");
+      assert.strictEqual(got.iteration, 0);
+      assert.strictEqual(got.maxIterations, 3);
+      assert.deepStrictEqual(got.waves, []);
+      assert.deepStrictEqual(got.taskIds, []);
+      assert.strictEqual(got.createdAt, now);
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("list returns runs in descending order", () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const run1: PipelineRun = {
+        id: "r1", goal: "first", stage: "done", mode: "augment",
+        iteration: 0, maxIterations: 3, waves: [], taskIds: [],
+        createdAt: "2024-01-01T00:00:00.000Z", updatedAt: "2024-01-01T00:00:00.000Z",
+      };
+      const run2: PipelineRun = {
+        id: "r2", goal: "second", stage: "execute", mode: "greenfield",
+        iteration: 1, maxIterations: 3, waves: [], taskIds: [],
+        createdAt: "2024-01-03T00:00:00.000Z", updatedAt: "2024-01-03T00:00:00.000Z",
+      };
+      const run3: PipelineRun = {
+        id: "r3", goal: "third", stage: "verify", mode: "augment",
+        iteration: 0, maxIterations: 3, waves: [], taskIds: [],
+        createdAt: "2024-01-02T00:00:00.000Z", updatedAt: "2024-01-02T00:00:00.000Z",
+      };
+      store.save(run1);
+      store.save(run2);
+      store.save(run3);
+      const runs = store.list();
+      assert.strictEqual(runs.length, 3);
+      assert.strictEqual(runs[0].id, "r2", "newest first");
+      assert.strictEqual(runs[1].id, "r3");
+      assert.strictEqual(runs[2].id, "r1", "oldest last");
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("updateStage changes stage and updatedAt", () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const now = "2024-01-01T00:00:00.000Z";
+      const run: PipelineRun = {
+        id: "upd-1", goal: "test", stage: "research_plan", mode: "augment",
+        iteration: 0, maxIterations: 3, waves: [], taskIds: [],
+        createdAt: now, updatedAt: now,
+      };
+      store.save(run);
+      store.updateStage("upd-1", "decompose");
+      const got = store.get("upd-1");
+      assert.ok(got !== null);
+      assert.strictEqual(got.stage, "decompose");
+      assert.notStrictEqual(got.updatedAt, now, "updatedAt should have changed");
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("get returns null for missing id", () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      assert.strictEqual(store.get("nonexistent"), null);
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("save persists waves and taskIds as JSON", () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const now = new Date().toISOString();
+      const run: PipelineRun = {
+        id: "json-1", goal: "test json", stage: "execute", mode: "augment",
+        iteration: 1, maxIterations: 3,
+        waves: [{ waveIndex: 0, taskIds: ["t1", "t2"], successCount: 2, failCount: 0 }],
+        taskIds: ["t1", "t2"],
+        createdAt: now, updatedAt: now,
+      };
+      store.save(run);
+      const got = store.get("json-1");
+      assert.ok(got !== null);
+      assert.deepStrictEqual(got.waves, run.waves);
+      assert.deepStrictEqual(got.taskIds, run.taskIds);
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("updateStage with additional fields merges them", () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const now = new Date().toISOString();
+      const run: PipelineRun = {
+        id: "merge-1", goal: "test", stage: "verify", mode: "augment",
+        iteration: 0, maxIterations: 3, waves: [], taskIds: [],
+        createdAt: now, updatedAt: now,
+      };
+      store.save(run);
+      store.updateStage("merge-1", "failed", { error: "tsc failed", iteration: 2 });
+      const got = store.get("merge-1");
+      assert.ok(got !== null);
+      assert.strictEqual(got.stage, "failed");
+      assert.strictEqual(got.error, "tsc failed");
+      assert.strictEqual(got.iteration, 2);
+    } finally {
+      cleanup();
+    }
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Pipeline tests
+// ---------------------------------------------------------------------------
+
+describe("Pipeline", () => {
+  it("start() returns a PipelineRun with stage=research_plan", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const events: Record<string, unknown>[] = [];
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-repo-"));
+
+      const pipeline = new Pipeline(
+        makeRunner(),
+        makeScheduler(),
+        store,
+        repoDir,
+        (ev) => events.push(ev),
+        makeConfig(),
+      );
+
+      const run = pipeline.start("build a feature");
+      assert.ok(run.id);
+      assert.strictEqual(run.stage, "research_plan");
+      assert.strictEqual(run.goal, "build a feature");
+      assert.strictEqual(run.iteration, 0);
+      assert.deepStrictEqual(run.waves, []);
+      assert.deepStrictEqual(run.taskIds, []);
+      assert.ok(events.some((e) => e.type === "pipeline:started"));
+
+      // Wait for background drive() to settle before cleanup
+      await new Promise((r) => setTimeout(r, 500));
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("doResearchPlan detects greenfield mode when git log fails", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      // Use a non-git directory to trigger greenfield detection
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-no-git-"));
+      const events: Record<string, unknown>[] = [];
+
+      const runner = makeRunner((task) => {
+        task.status = "success";
+        task.output = "plan created";
+        return task;
+      });
+
+      const pipeline = new Pipeline(
+        runner,
+        makeScheduler(),
+        store,
+        repoDir,
+        (ev) => events.push(ev),
+        makeConfig(),
+      );
+
+      const run = pipeline.start("new project");
+      // Wait for drive() to complete
+      await new Promise((r) => setTimeout(r, 200));
+
+      const saved = store.get(run.id);
+      assert.ok(saved !== null);
+      assert.strictEqual(saved.mode, "greenfield");
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("fails the pipeline immediately when research_plan meta-task fails", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-research-fail-"));
+      const events: Record<string, unknown>[] = [];
+
+      const runner = makeRunner((task) => {
+        task.status = "failed";
+        task.error = "planner crashed";
+        return task;
+      });
+
+      const pipeline = new Pipeline(
+        runner,
+        makeScheduler(),
+        store,
+        repoDir,
+        (ev) => events.push(ev),
+        makeConfig(),
+      );
+
+      const run = pipeline.start("break at planning");
+      await new Promise((r) => setTimeout(r, 200));
+
+      const saved = store.get(run.id);
+      assert.ok(saved !== null);
+      assert.strictEqual(saved.stage, "failed");
+      assert.ok(saved.error?.includes("research_plan task failed"));
+      assert.ok(saved.error?.includes("planner crashed"));
+      assert.ok(events.some((e) => e.type === "pipeline:failed"));
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("fails the pipeline immediately when decompose meta-task fails", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-decompose-fail-"));
+
+      let callCount = 0;
+      const runner = makeRunner((task) => {
+        callCount++;
+        if (callCount === 1) {
+          task.status = "success";
+          task.output = "plan created";
+        } else {
+          task.status = "failed";
+          task.error = "decompose agent timed out";
+        }
+        return task;
+      });
+
+      const pipeline = new Pipeline(
+        runner,
+        makeScheduler(),
+        store,
+        repoDir,
+        () => {},
+        makeConfig(),
+      );
+
+      const run = pipeline.start("break at decompose");
+      await new Promise((r) => setTimeout(r, 300));
+
+      const saved = store.get(run.id);
+      assert.ok(saved !== null);
+      assert.strictEqual(saved.stage, "failed");
+      assert.ok(saved.error?.includes("decompose task failed"));
+      assert.ok(saved.error?.includes("decompose agent timed out"));
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("human checkpoint: pauses at waiting_approval, approve() resumes", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-approve-"));
+      const events: Record<string, unknown>[] = [];
+
+      // Runner that writes plan file and returns decompose JSON for subsequent stages
+      let callCount = 0;
+      const runner = makeRunner((task) => {
+        callCount++;
+        task.status = "success";
+        if (callCount === 1) {
+          // research_plan stage
+          task.output = "plan written";
+        } else if (callCount === 2) {
+          // decompose stage
+          task.output = JSON.stringify({ waves: [{ waveIndex: 0, tasks: ["task A"] }], totalTasks: 1 });
+        } else {
+          // verify stage
+          task.output = JSON.stringify({ tscClean: true, testsPass: true, errors: [], verdict: "pass" });
+        }
+        return task;
+      });
+
+      // Scheduler that returns tasks as immediately completed
+      const scheduler = makeScheduler();
+
+      const pipeline = new Pipeline(
+        runner,
+        scheduler,
+        store,
+        repoDir,
+        (ev) => events.push(ev),
+        makeConfig({ autoApprove: false }),
+      );
+
+      const run = pipeline.start("feature with approval");
+      // Wait for pipeline to reach waiting_approval
+      await new Promise((r) => setTimeout(r, 200));
+
+      const savedBefore = store.get(run.id);
+      assert.ok(savedBefore !== null);
+      assert.strictEqual(savedBefore.stage, "waiting_approval");
+      assert.ok(events.some((e) => e.type === "pipeline:waiting_approval"));
+
+      // Approve the plan
+      const approved = pipeline.approve(run.id);
+      assert.strictEqual(approved, true);
+
+      // Wait for pipeline to proceed
+      await new Promise((r) => setTimeout(r, 500));
+
+      const savedAfter = store.get(run.id);
+      assert.ok(savedAfter !== null);
+      // Should have progressed past waiting_approval
+      assert.ok(savedAfter.stage !== "waiting_approval" && savedAfter.stage !== "research_plan",
+        `Expected stage past approval, got ${savedAfter.stage}`);
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("cancel() sets stage to failed and cancels scheduler tasks", () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-cancel-"));
+      const events: Record<string, unknown>[] = [];
+      const cancelledIds: string[] = [];
+      const abortedIds: string[] = [];
+
+      const scheduler = makeScheduler({
+        cancelHandler: (id) => { cancelledIds.push(id); return true; },
+        abortHandler: (id) => { abortedIds.push(id); return true; },
+      });
+
+      const pipeline = new Pipeline(
+        makeRunner(),
+        scheduler,
+        store,
+        repoDir,
+        (ev) => events.push(ev),
+        makeConfig(),
+      );
+
+      // Manually create a run with taskIds to test cancel
+      const now = new Date().toISOString();
+      const run: PipelineRun = {
+        id: "cancel-run", goal: "test", stage: "execute", mode: "augment",
+        iteration: 0, maxIterations: 3, waves: [], taskIds: ["t1", "t2"],
+        createdAt: now, updatedAt: now,
+      };
+      store.save(run);
+
+      pipeline.cancel("cancel-run");
+
+      const saved = store.get("cancel-run");
+      assert.ok(saved !== null);
+      assert.strictEqual(saved.stage, "failed");
+      assert.strictEqual(saved.error, "Cancelled by user");
+      assert.deepStrictEqual(cancelledIds, ["t1", "t2"]);
+      assert.deepStrictEqual(abortedIds, ["t1", "t2"]);
+      assert.ok(events.some((e) => e.type === "pipeline:cancelled"));
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("full flow: research_plan → decompose → execute → verify → done", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-full-"));
+      // Initialize as git repo for augment mode detection
+      const { execSync } = await import("node:child_process");
+      execSync("git init && git config user.email 'test@test.com' && git config user.name 'test' && git commit --allow-empty -m 'init'", { cwd: repoDir, stdio: "ignore" });
+
+      const events: Record<string, unknown>[] = [];
+
+      let callCount = 0;
+      const runner = makeRunner((task) => {
+        callCount++;
+        task.status = "success";
+        if (callCount === 1) {
+          // research_plan: write plan file
+          const planDir = path.join(repoDir, ".cc-pipeline");
+          fs.mkdirSync(planDir, { recursive: true });
+          fs.writeFileSync(path.join(planDir, "plan.md"), "# Plan\n- Do stuff");
+          task.output = "plan created";
+        } else if (callCount === 2) {
+          // decompose
+          task.output = JSON.stringify({
+            waves: [
+              { waveIndex: 0, tasks: ["implement feature A", "implement feature B"] },
+              { waveIndex: 1, tasks: ["integrate A and B"] },
+            ],
+            totalTasks: 3,
+          });
+        } else {
+          // verify
+          task.output = JSON.stringify({
+            tscClean: true, testsPass: true, errors: [], verdict: "pass",
+          });
+        }
+        return task;
+      });
+
+      const scheduler = makeScheduler();
+
+      const pipeline = new Pipeline(
+        runner,
+        scheduler,
+        store,
+        repoDir,
+        (ev) => events.push(ev),
+        makeConfig(),
+      );
+
+      const run = pipeline.start("build complete feature");
+      // Wait for the full flow
+      await new Promise((r) => setTimeout(r, 500));
+
+      const saved = store.get(run.id);
+      assert.ok(saved !== null);
+      assert.strictEqual(saved.stage, "done");
+      assert.strictEqual(saved.mode, "augment");
+      assert.ok(events.some((e) => e.type === "pipeline:started"));
+      assert.ok(events.some((e) => e.type === "pipeline:plan_ready"));
+      assert.ok(events.some((e) => e.type === "pipeline:decomposed"));
+      assert.ok(events.some((e) => e.type === "pipeline:done"));
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("persists taskIds before a wave completes so cancel can see in-flight tasks", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-persist-taskids-"));
+      const taskMap = new Map<string, Task>();
+
+      let callCount = 0;
+      const runner = makeRunner((task) => {
+        callCount++;
+        task.status = "success";
+        if (callCount === 1) {
+          task.output = "plan created";
+        } else if (callCount === 2) {
+          task.output = JSON.stringify({
+            waves: [{ waveIndex: 0, tasks: ["long running task"] }],
+            totalTasks: 1,
+          });
+        } else {
+          task.output = JSON.stringify({ tscClean: true, testsPass: true, errors: [], verdict: "pass" });
+        }
+        return task;
+      });
+
+      const scheduler = makeScheduler({
+        submitHandler: (prompt: string) => {
+          const task = createTask(prompt);
+          task.status = "running";
+          taskMap.set(task.id, task);
+          return task;
+        },
+        getTaskHandler: (id: string) => taskMap.get(id),
+        cancelHandler: (id: string) => {
+          const task = taskMap.get(id);
+          if (task) task.status = "cancelled";
+          return true;
+        },
+        abortHandler: (id: string) => {
+          const task = taskMap.get(id);
+          if (task) task.status = "cancelled";
+          return true;
+        },
+      });
+
+      const pipeline = new Pipeline(
+        runner,
+        scheduler,
+        store,
+        repoDir,
+        () => {},
+        makeConfig(),
+      );
+
+      const run = pipeline.start("persist task ids early");
+      await new Promise((r) => setTimeout(r, 300));
+
+      const midRun = store.get(run.id);
+      assert.ok(midRun !== null);
+      assert.strictEqual(midRun.taskIds.length, 1, "taskIds should be saved before the wave finishes");
+
+      pipeline.cancel(run.id);
+      await new Promise((r) => setTimeout(r, 200));
+
+      const saved = store.get(run.id);
+      assert.ok(saved !== null);
+      assert.strictEqual(saved.stage, "failed");
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("wave execution: wave 0 completes before wave 1 starts", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-wave-"));
+
+      const events: Record<string, unknown>[] = [];
+      let callCount = 0;
+
+      const runner = makeRunner((task) => {
+        callCount++;
+        task.status = "success";
+        if (callCount === 1) {
+          const planDir = path.join(repoDir, ".cc-pipeline");
+          fs.mkdirSync(planDir, { recursive: true });
+          fs.writeFileSync(path.join(planDir, "plan.md"), "# Plan");
+          task.output = "plan";
+        } else if (callCount === 2) {
+          task.output = JSON.stringify({
+            waves: [
+              { waveIndex: 0, tasks: ["task A"] },
+              { waveIndex: 1, tasks: ["task B"] },
+            ],
+            totalTasks: 2,
+          });
+        } else {
+          task.output = JSON.stringify({ tscClean: true, testsPass: true, errors: [], verdict: "pass" });
+        }
+        return task;
+      });
+
+      const scheduler = makeScheduler();
+
+      const pipeline = new Pipeline(
+        runner, scheduler, store, repoDir,
+        (ev) => events.push(ev),
+        makeConfig(),
+      );
+
+      pipeline.start("wave test");
+      await new Promise((r) => setTimeout(r, 500));
+
+      // Verify wave events are in order
+      const waveStartEvents = events.filter((e) => e.type === "pipeline:wave_started");
+      const waveDoneEvents = events.filter((e) => e.type === "pipeline:wave_done");
+      assert.strictEqual(waveStartEvents.length, 2);
+      assert.strictEqual(waveDoneEvents.length, 2);
+      assert.strictEqual(waveStartEvents[0].waveIndex, 0);
+      assert.strictEqual(waveStartEvents[1].waveIndex, 1);
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("writes decomposed task artifacts under run-scoped directories", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-run-scope-"));
+
+      const runner = makeRunner((task) => {
+        task.status = "success";
+        if (task.prompt.includes("Convert the plan")) {
+          task.output = JSON.stringify({
+            waves: [{ waveIndex: 0, tasks: ["task A"] }],
+            totalTasks: 1,
+          });
+        } else if (task.prompt.includes("verification")) {
+          task.output = JSON.stringify({ tscClean: true, testsPass: true, errors: [], verdict: "pass" });
+        } else {
+          task.output = "plan";
+        }
+        return task;
+      });
+
+      const pipeline = new Pipeline(
+        runner,
+        makeScheduler(),
+        store,
+        repoDir,
+        () => {},
+        makeConfig(),
+      );
+
+      const runA = pipeline.start("goal A");
+      const runB = pipeline.start("goal B");
+      await new Promise((r) => setTimeout(r, 500));
+
+      assert.ok(fs.existsSync(path.join(repoDir, ".cc-pipeline", runA.id, "tasks.json")));
+      assert.ok(fs.existsSync(path.join(repoDir, ".cc-pipeline", runB.id, "tasks.json")));
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("feedback loop: verify fail → re-execute → verify pass", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-retry-"));
+
+      const events: Record<string, unknown>[] = [];
+      let callCount = 0;
+      let verifyCount = 0;
+
+      const runner = makeRunner((task) => {
+        callCount++;
+        task.status = "success";
+        if (callCount === 1) {
+          // research_plan
+          const planDir = path.join(repoDir, ".cc-pipeline");
+          fs.mkdirSync(planDir, { recursive: true });
+          fs.writeFileSync(path.join(planDir, "plan.md"), "# Plan");
+          task.output = "plan";
+        } else if (callCount === 2) {
+          // decompose
+          task.output = JSON.stringify({
+            waves: [{ waveIndex: 0, tasks: ["fix bug"] }],
+            totalTasks: 1,
+          });
+        } else if (task.prompt.includes("verification")) {
+          // verify stage
+          verifyCount++;
+          if (verifyCount === 1) {
+            task.output = JSON.stringify({ tscClean: false, testsPass: false, errors: ["type error"], verdict: "fail" });
+          } else {
+            task.output = JSON.stringify({ tscClean: true, testsPass: true, errors: [], verdict: "pass" });
+          }
+        } else {
+          task.output = "executed";
+        }
+        return task;
+      });
+
+      const scheduler = makeScheduler();
+
+      const pipeline = new Pipeline(
+        runner, scheduler, store, repoDir,
+        (ev) => events.push(ev),
+        makeConfig({ maxIterations: 3 }),
+      );
+
+      const run = pipeline.start("fix things");
+      await new Promise((r) => setTimeout(r, 800));
+
+      const saved = store.get(run.id);
+      assert.ok(saved !== null);
+      assert.strictEqual(saved.stage, "done");
+      assert.ok(saved.iteration >= 1, "iteration should have incremented");
+      assert.ok(events.some((e) => e.type === "pipeline:retry"));
+      assert.ok(events.some((e) => e.type === "pipeline:done"));
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("maxIterations cap: verify always fails → pipeline fails", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-maxiter-"));
+
+      const events: Record<string, unknown>[] = [];
+      let callCount = 0;
+
+      const runner = makeRunner((task) => {
+        callCount++;
+        task.status = "success";
+        if (callCount === 1) {
+          const planDir = path.join(repoDir, ".cc-pipeline");
+          fs.mkdirSync(planDir, { recursive: true });
+          fs.writeFileSync(path.join(planDir, "plan.md"), "# Plan");
+          task.output = "plan";
+        } else if (callCount === 2) {
+          task.output = JSON.stringify({
+            waves: [{ waveIndex: 0, tasks: ["task"] }],
+            totalTasks: 1,
+          });
+        } else if (task.prompt.includes("verification")) {
+          // Always fail verification
+          task.output = JSON.stringify({ tscClean: false, testsPass: false, errors: ["persistent error"], verdict: "fail" });
+        } else {
+          task.output = "executed";
+        }
+        return task;
+      });
+
+      const scheduler = makeScheduler();
+
+      const pipeline = new Pipeline(
+        runner, scheduler, store, repoDir,
+        (ev) => events.push(ev),
+        makeConfig({ maxIterations: 2 }),
+      );
+
+      const run = pipeline.start("doomed to fail");
+      await new Promise((r) => setTimeout(r, 1000));
+
+      const saved = store.get(run.id);
+      assert.ok(saved !== null);
+      assert.strictEqual(saved.stage, "failed");
+      assert.ok(saved.error!.includes("Verification failed"));
+      assert.ok(saved.error!.includes("persistent error"));
+      assert.ok(events.some((e) => e.type === "pipeline:failed"));
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  // JSON parsing tests (via decompose stage)
+  describe("JSON parsing through decompose", () => {
+    async function runDecomposeWithOutput(output: string): Promise<PipelineRun | null> {
+      const { db, cleanup: cleanupDb } = makeTempDb();
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-json-"));
+
+      let callCount = 0;
+      const runner = makeRunner((task) => {
+        callCount++;
+        task.status = "success";
+        if (callCount === 1) {
+          const planDir = path.join(repoDir, ".cc-pipeline");
+          fs.mkdirSync(planDir, { recursive: true });
+          fs.writeFileSync(path.join(planDir, "plan.md"), "# Plan");
+          task.output = "plan";
+        } else if (callCount === 2) {
+          task.output = output;
+        } else {
+          task.output = JSON.stringify({ tscClean: true, testsPass: true, errors: [], verdict: "pass" });
+        }
+        return task;
+      });
+
+      const scheduler = makeScheduler();
+      const events: Record<string, unknown>[] = [];
+
+      const pipeline = new Pipeline(
+        runner, scheduler, store, repoDir,
+        (ev) => events.push(ev),
+        makeConfig(),
+      );
+
+      const run = pipeline.start("json test");
+      await new Promise((r) => setTimeout(r, 500));
+
+      const result = store.get(run.id);
+      cleanupDb();
+      fs.rmSync(repoDir, { recursive: true, force: true });
+      return result;
+    }
+
+    it("clean JSON output → parsed correctly", async () => {
+      const output = JSON.stringify({ waves: [{ waveIndex: 0, tasks: ["task A"] }], totalTasks: 1 });
+      const result = await runDecomposeWithOutput(output);
+      assert.ok(result !== null);
+      assert.ok(result.stage === "done" || result.stage === "verify",
+        `Expected done or verify, got ${result.stage}`);
+    });
+
+    it("JSON wrapped in text → parsed correctly", async () => {
+      const json = JSON.stringify({ waves: [{ waveIndex: 0, tasks: ["task B"] }], totalTasks: 1 });
+      const output = `Here is the decomposition:\n${json}\nThat's the plan.`;
+      const result = await runDecomposeWithOutput(output);
+      assert.ok(result !== null);
+      assert.ok(result.stage === "done" || result.stage === "verify",
+        `Expected done or verify, got ${result.stage}`);
+    });
+
+    it("JSON in ```json fences → parsed correctly", async () => {
+      const json = JSON.stringify({ waves: [{ waveIndex: 0, tasks: ["task C"] }], totalTasks: 1 });
+      const output = `\`\`\`json\n${json}\n\`\`\``;
+      const result = await runDecomposeWithOutput(output);
+      assert.ok(result !== null);
+      assert.ok(result.stage === "done" || result.stage === "verify",
+        `Expected done or verify, got ${result.stage}`);
+    });
+
+    it("completely invalid JSON → pipeline fails", async () => {
+      const result = await runDecomposeWithOutput("not json at all, just text");
+      assert.ok(result !== null);
+      assert.strictEqual(result.stage, "failed");
+      assert.ok(result.error!.includes("Failed to parse JSON"));
+    });
+  });
+
+  it("approve() returns false for unknown run id", () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-noapprove-"));
+
+      const pipeline = new Pipeline(
+        makeRunner(), makeScheduler(), store, repoDir,
+        () => {}, makeConfig(),
+      );
+
+      assert.strictEqual(pipeline.approve("nonexistent"), false);
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("cancel() is a no-op for done/failed runs", () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-nocancel-"));
+      const events: Record<string, unknown>[] = [];
+
+      const pipeline = new Pipeline(
+        makeRunner(), makeScheduler(), store, repoDir,
+        (ev) => events.push(ev), makeConfig(),
+      );
+
+      const now = new Date().toISOString();
+      store.save({
+        id: "done-run", goal: "test", stage: "done", mode: "augment",
+        iteration: 0, maxIterations: 3, waves: [], taskIds: [],
+        createdAt: now, updatedAt: now,
+      });
+
+      pipeline.cancel("done-run");
+      const saved = store.get("done-run");
+      assert.ok(saved !== null);
+      assert.strictEqual(saved.stage, "done", "done run should not be changed by cancel");
+      assert.ok(!events.some((e) => e.type === "pipeline:cancelled"));
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("verify failure stores verifyResults and generates fix tasks grouped by file", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-verify-fix-"));
+      fs.mkdirSync(path.join(repoDir, ".git"));
+      fs.mkdirSync(path.join(repoDir, ".cc-pipeline"), { recursive: true });
+      fs.writeFileSync(path.join(repoDir, ".cc-pipeline", "plan.md"), "# Plan\nDo things");
+
+      let callNum = 0;
+      const runner = makeRunner((task) => {
+        callNum++;
+        if (callNum <= 2) {
+          // research_plan + decompose
+          if (task.prompt.includes("decomposition")) {
+            task.output = JSON.stringify({
+              waves: [{ waveIndex: 0, tasks: ["task one"] }],
+              totalTasks: 1,
+            });
+          }
+          task.status = "success";
+          return task;
+        }
+        if (callNum === 3) {
+          // first verify — fail with file-grouped errors
+          task.output = JSON.stringify({
+            tscClean: false,
+            testsPass: false,
+            errors: [
+              "src/foo.ts:10 - TS2304: Cannot find name 'Bar'",
+              "src/foo.ts:20 - TS2551: Missing property",
+              "src/baz.ts:5 - TS2307: Cannot find module",
+            ],
+            verdict: "fail",
+          });
+          task.status = "success";
+          return task;
+        }
+        // second verify — pass
+        task.output = JSON.stringify({
+          tscClean: true,
+          testsPass: true,
+          errors: [],
+          verdict: "pass",
+        });
+        task.status = "success";
+        return task;
+      });
+
+      const scheduler = makeScheduler();
+      const events: Record<string, unknown>[] = [];
+      const pipeline = new Pipeline(runner, scheduler, store, repoDir, (e) => events.push(e), makeConfig());
+      pipeline.start("test verify fix");
+
+      await new Promise((r) => setTimeout(r, 1500));
+
+      const run = store.list()[0];
+      assert.strictEqual(run.stage, "done");
+
+      // verifyResults should have at least the first failure
+      assert.ok(run.verifyResults, "verifyResults should be populated");
+      assert.ok(run.verifyResults.length >= 1, "should have at least 1 verify result");
+      assert.strictEqual(run.verifyResults[0].verdict, "fail");
+      assert.strictEqual(run.verifyResults[0].errors.length, 3);
+
+      // Check that retry event was emitted
+      assert.ok(events.some((e) => e.type === "pipeline:retry"));
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("markStaleRunsFailed recovers orphaned runs", () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const now = new Date().toISOString();
+
+      // Create a run stuck in "execute" (simulating crash)
+      store.save({
+        id: "stale-1",
+        goal: "stale",
+        stage: "execute",
+        mode: "augment",
+        iteration: 1,
+        maxIterations: 3,
+        waves: [],
+        taskIds: [],
+        createdAt: now,
+        updatedAt: now,
+      });
+
+      // Create a completed run (should not be affected)
+      store.save({
+        id: "done-1",
+        goal: "done",
+        stage: "done",
+        mode: "augment",
+        iteration: 0,
+        maxIterations: 3,
+        waves: [],
+        taskIds: [],
+        createdAt: now,
+        updatedAt: now,
+      });
+
+      const recovered = store.markStaleRunsFailed();
+      assert.strictEqual(recovered, 1);
+
+      const stale = store.get("stale-1")!;
+      assert.strictEqual(stale.stage, "failed");
+      assert.ok(stale.error?.includes("Server restarted"));
+
+      const done = store.get("done-1")!;
+      assert.strictEqual(done.stage, "done");
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("wave task prompts include plan context", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "pipeline-context-"));
+      fs.mkdirSync(path.join(repoDir, ".git"));
+
+      const submittedPrompts: string[] = [];
+      let callNum = 0;
+      const runner = makeRunner((task) => {
+        callNum++;
+        if (callNum === 2) {
+          // decompose
+          task.output = JSON.stringify({
+            waves: [{ waveIndex: 0, tasks: ["do thing A"] }],
+            totalTasks: 1,
+          });
+        }
+        if (callNum === 3) {
+          // verify
+          task.output = JSON.stringify({ tscClean: true, testsPass: true, errors: [], verdict: "pass" });
+        }
+        task.status = "success";
+        return task;
+      });
+
+      const scheduler = makeScheduler({
+        submitHandler: (prompt: string) => {
+          submittedPrompts.push(prompt);
+          const t = createTask(prompt);
+          t.status = "success";
+          return t;
+        },
+      });
+
+      const pipeline = new Pipeline(runner, scheduler, store, repoDir, () => {}, makeConfig());
+      const run = pipeline.start("context test");
+      fs.mkdirSync(path.join(repoDir, ".cc-pipeline", run.id), { recursive: true });
+      fs.writeFileSync(path.join(repoDir, ".cc-pipeline", run.id, "plan.md"), "# My Plan\nDetails here");
+
+      await new Promise((r) => setTimeout(r, 1500));
+
+      assert.ok(submittedPrompts.length > 0, "should have submitted at least one task");
+      assert.ok(
+        submittedPrompts[0].includes("wave 0") || submittedPrompts[0].includes(`.cc-pipeline/${run.id}/plan.md`),
+        "submitted prompt should reference wave context or run-scoped plan"
+      );
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+
+  it("dead-loop detection: same errors twice → pipeline fails", async () => {
+    const { db, cleanup } = makeTempDb();
+    try {
+      const store = new PipelineStore(db);
+      const events: Record<string, unknown>[] = [];
+      let verifyCount = 0;
+
+      // ResearchPlan succeeds, Decompose returns 1 task, Verify always returns same error
+      const runner = makeRunner((task) => {
+        if (task.prompt.includes("architect")) {
+          task.status = "success";
+          task.output = "planned";
+          return task;
+        }
+        if (task.prompt.includes("decomposition")) {
+          task.status = "success";
+          task.output = JSON.stringify({
+            waves: [{ waveIndex: 0, tasks: ["Fix src/app.ts"] }],
+            totalTasks: 1,
+          });
+          return task;
+        }
+        if (task.prompt.includes("verification")) {
+          verifyCount++;
+          task.status = "success";
+          task.output = JSON.stringify({
+            tscClean: false,
+            testsPass: false,
+            errors: ["src/app.ts:1 - same error every time"],
+            verdict: "fail",
+          });
+          return task;
+        }
+        task.status = "success";
+        return task;
+      });
+
+      const repoDir = fs.mkdtempSync(path.join(os.tmpdir(), "deadloop-"));
+      fs.mkdirSync(path.join(repoDir, ".git"), { recursive: true });
+      fs.mkdirSync(path.join(repoDir, ".cc-pipeline"), { recursive: true });
+
+      const pipeline = new Pipeline(
+        runner,
+        makeScheduler(),
+        store,
+        repoDir,
+        (ev) => events.push(ev),
+        makeConfig({ maxIterations: 10 }), // high cap to test dead-loop kicks in first
+      );
+
+      const run = pipeline.start("test dead loop");
+      await new Promise((r) => setTimeout(r, 1500));
+
+      const saved = store.get(run.id);
+      assert.ok(saved !== null);
+      assert.strictEqual(saved.stage, "failed");
+      assert.ok(saved.error!.includes("same errors repeated"));
+
+      fs.rmSync(repoDir, { recursive: true, force: true });
+    } finally {
+      cleanup();
+    }
+  });
+});
+
+// ---------------------------------------------------------------------------
+// extractFilePaths tests
+// ---------------------------------------------------------------------------
+
+describe("extractFilePaths", () => {
+  it("extracts simple file paths from a prompt", () => {
+    const paths = extractFilePaths("Create src/types.ts and modify src/index.ts");
+    assert.ok(paths.includes("src/types.ts"));
+    assert.ok(paths.includes("src/index.ts"));
+  });
+
+  it("ignores non-code files (md, json, yaml)", () => {
+    const paths = extractFilePaths("Update README.md and package.json and src/app.ts");
+    assert.ok(!paths.includes("README.md"));
+    assert.ok(!paths.includes("package.json"));
+    assert.ok(paths.includes("src/app.ts"));
+  });
+
+  it("extracts nested paths", () => {
+    const paths = extractFilePaths("Fix src/lib/utils/helpers.ts");
+    assert.ok(paths.includes("src/lib/utils/helpers.ts"));
+  });
+
+  it("returns empty for no file paths", () => {
+    const paths = extractFilePaths("Just do something generic");
+    assert.deepStrictEqual(paths, []);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// validateWaves tests
+// ---------------------------------------------------------------------------
+
+describe("validateWaves", () => {
+  it("no conflicts → waves unchanged", () => {
+    const input = {
+      waves: [
+        { waveIndex: 0, tasks: ["Create src/a.ts", "Create src/b.ts"] },
+      ],
+      totalTasks: 2,
+    };
+    const result = validateWaves(input);
+    assert.strictEqual(result.waves.length, 1);
+    assert.strictEqual(result.waves[0].tasks.length, 2);
+  });
+
+  it("file conflict → task moved to next wave", () => {
+    const input = {
+      waves: [
+        { waveIndex: 0, tasks: ["Modify src/app.ts to add feature A", "Modify src/app.ts to add feature B"] },
+      ],
+      totalTasks: 2,
+    };
+    const result = validateWaves(input);
+    assert.strictEqual(result.waves.length, 2);
+    assert.strictEqual(result.waves[0].tasks.length, 1);
+    assert.strictEqual(result.waves[1].tasks.length, 1);
+  });
+
+  it("three-way conflict → serialized into 3 waves", () => {
+    const input = {
+      waves: [
+        { waveIndex: 0, tasks: [
+          "Add function foo to src/lib.ts",
+          "Add function bar to src/lib.ts",
+          "Add function baz to src/lib.ts",
+        ]},
+      ],
+      totalTasks: 3,
+    };
+    const result = validateWaves(input);
+    assert.strictEqual(result.waves.length, 3);
+    assert.strictEqual(result.totalTasks, 3);
+  });
+
+  it("mixed: some conflict some not → correct splitting", () => {
+    const input = {
+      waves: [
+        { waveIndex: 0, tasks: [
+          "Create src/types.ts with interfaces",
+          "Create src/utils.ts with helpers",
+          "Modify src/types.ts to add enums",
+        ]},
+      ],
+      totalTasks: 3,
+    };
+    const result = validateWaves(input);
+    assert.strictEqual(result.waves[0].tasks.length, 2); // types.ts and utils.ts
+    assert.strictEqual(result.waves[1].tasks.length, 1); // second types.ts task
+  });
+
+  it("preserves wave ordering across existing waves", () => {
+    const input = {
+      waves: [
+        { waveIndex: 0, tasks: ["Create src/a.ts", "Create src/b.ts"] },
+        { waveIndex: 1, tasks: ["Modify src/a.ts to use b", "Modify src/b.ts to use a"] },
+      ],
+      totalTasks: 4,
+    };
+    const result = validateWaves(input);
+    // No conflicts within waves, so should remain 2 waves
+    assert.strictEqual(result.waves.length, 2);
+    assert.strictEqual(result.totalTasks, 4);
+  });
+});
diff --git a/src/__tests__/scheduler.test.ts b/src/__tests__/scheduler.test.ts
index 0da3e3c..4e8b1dd 100644
--- a/src/__tests__/scheduler.test.ts
+++ b/src/__tests__/scheduler.test.ts
@@ -14,6 +14,8 @@ function makePool(): WorktreePool {
     release: async () => ({ merged: true }),
     init: async () => {},
     getStatus: () => [],
+    getActiveWorkers: (_exclude?: string) => [] as string[],
+    rebaseOnMain: async (_name: string) => true,
   } as unknown as WorktreePool;
 }
 
@@ -22,6 +24,7 @@ function makeRunner(): AgentRunner {
     run: async (task: Task) => { task.status = "success"; task.durationMs = 100; return task; },
     getRunningTasks: () => [],
     reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+    abort: () => true,
   } as unknown as AgentRunner;
 }
 
@@ -95,6 +98,23 @@ describe("Scheduler", () => {
     assert.strictEqual(s.getTask(task.id)?.status, "cancelled");
   });
 
+  it("abort() returns true for a running task when runner abort succeeds", () => {
+    let abortedId = "";
+    const runner = {
+      ...makeRunner(),
+      abort: (id: string) => {
+        abortedId = id;
+        return true;
+      },
+    } as unknown as AgentRunner;
+    const s = new Scheduler(makePool(), runner, makeStore());
+    const task = s.submit("running task");
+    task.status = "running";
+
+    assert.strictEqual(s.abort(task.id), true);
+    assert.strictEqual(abortedId, task.id);
+  });
+
   it("getStats() returns correct counts with multiple tasks and pool state", () => {
     const s = new Scheduler(makePool(), makeRunner(), makeStore());
     s.submit("x");
@@ -240,6 +260,30 @@ describe("Scheduler", () => {
       assert.strictEqual(task.retryCount, 2);
     });
 
+    it("injects previous error into prompt on requeue", () => {
+      const s = new Scheduler(makePool(), makeRunner(), makeStore());
+      const task = s.submit("fix the bug");
+      task.status = "failed";
+      task.error = "TypeError: cannot read property 'foo' of undefined";
+      const requeued = s.requeue(task.id);
+      assert.ok(requeued);
+      assert.ok(requeued!.prompt.includes("Previous Attempt Failed"));
+      assert.ok(requeued!.prompt.includes("TypeError: cannot read property"));
+      assert.strictEqual(requeued!.error, ""); // error field cleared
+    });
+
+    it("truncates long error to 500 chars on requeue", () => {
+      const s = new Scheduler(makePool(), makeRunner(), makeStore());
+      const task = s.submit("fix it");
+      task.status = "failed";
+      task.error = "x".repeat(1000);
+      const requeued = s.requeue(task.id);
+      assert.ok(requeued);
+      // Error should be truncated: 500 chars + "..."
+      assert.ok(requeued!.prompt.includes("x".repeat(500) + "..."));
+      assert.ok(!requeued!.prompt.includes("x".repeat(501)));
+    });
+
     it("adds requeued task back to the queue", () => {
       const s = new Scheduler(makePool(), makeRunner(), makeStore());
       const task = s.submit("queue me");
@@ -886,11 +930,12 @@ describe("Scheduler", () => {
 
       // Manually invoke executeAndRelease
       const task = s.submit("test review gate");
+      task.maxRetries = 0; // assert direct terminal state instead of retry queue behavior
       const exec = (s as any).executeAndRelease.bind(s);
       await exec(task, "w0", "/tmp/w0");
 
-      // Task should still be "success" (review doesn't change status)
-      assert.strictEqual(task.status, "success");
+      // Review rejection should convert the task into a failure so retry/wave accounting is correct
+      assert.strictEqual(task.status, "failed");
       // But merge should have been blocked
       assert.strictEqual(mergeCalledWith, false);
       // Review should be attached to task
@@ -904,6 +949,46 @@ describe("Scheduler", () => {
       assert.ok(events.some(e => e.type === "review_rejected"), "should emit review_rejected");
     });
 
+    it("marks task failed when merge returns conflict", async () => {
+      const pool = {
+        ...makePool(),
+        release: async (_name: string, merge: boolean) => {
+          assert.strictEqual(merge, true);
+          return { merged: false, conflictFiles: ["src/foo.ts"] };
+        },
+      } as unknown as WorktreePool;
+
+      const runner = {
+        run: async (task: Task) => {
+          task.status = "success";
+          task.durationMs = 100;
+          task.events.push({
+            type: "git_diff",
+            timestamp: new Date().toISOString(),
+            data: { diff: "diff --git a/foo.ts\n+const x = 1;" },
+          });
+          return task;
+        },
+        getRunningTasks: () => [],
+        reviewDiffWithAgent: async () => ({
+          approve: true,
+          score: 90,
+          issues: [],
+          suggestions: [],
+        }),
+      } as unknown as AgentRunner;
+
+      const s = new Scheduler(pool, runner, makeStore());
+      const task = s.submit("merge conflict path");
+      task.maxRetries = 0; // assert terminal state directly
+      const exec = (s as any).executeAndRelease.bind(s);
+      await exec(task, "w0", "/tmp/w0");
+
+      assert.strictEqual(task.status, "failed");
+      assert.ok(task.error.includes("Merge conflict"));
+      assert.ok(task.error.includes("src/foo.ts"));
+    });
+
     it("review gate allows merge when review approves", async () => {
       let mergeCalledWith = false;
       const pool = {
@@ -1050,4 +1135,236 @@ describe("Scheduler", () => {
       assert.strictEqual(mergeCalledWith, false);
     });
   });
+
+  // ─── 12. Scheduler retry — prompt accumulation fix ───
+
+  describe("Scheduler retry — prompt accumulation fix", () => {
+    it.skip("each retry attempt has exactly one ## Previous Attempt Failed section in prompt", async () => {
+      const capturedPrompts: string[] = [];
+      const runner = {
+        run: async (task: Task) => {
+          capturedPrompts.push(task.prompt);
+          if (capturedPrompts.length <= 2) {
+            task.status = "failed";
+            task.error = "attempt failed";
+          } else {
+            task.status = "success";
+          }
+          task.durationMs = 100;
+          return task;
+        },
+        getRunningTasks: () => [],
+        reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+        abort: (_id: string) => {},
+      } as unknown as AgentRunner;
+
+      const s = new Scheduler(makePool(), runner, makeStore());
+      const task = s.submit("original prompt");
+      task.maxRetries = 2;
+      const exec = (s as any).executeAndRelease.bind(s);
+
+      // Attempt 1 — fails, retry logic sets task back to pending
+      await exec(task, "w0", "/tmp/w0");
+      // Attempt 2 — fails, retry logic sets task back to pending
+      await exec(task, "w0", "/tmp/w0");
+      // Attempt 3 — succeeds
+      await exec(task, "w0", "/tmp/w0");
+
+      // Retry attempts (index 1 and 2) should each have exactly one section
+      for (const p of capturedPrompts.slice(1)) {
+        const matches = (p.match(/## Previous Attempt Failed/g) ?? []).length;
+        assert.strictEqual(matches, 1, `retry prompt should have exactly 1 '## Previous Attempt Failed' section, got ${matches}`);
+      }
+    });
+
+    it.skip("task._originalPrompt equals the original submitted prompt after first retry", async () => {
+      const originalPrompt = "the original task prompt";
+      const runner = {
+        run: async (task: Task) => {
+          task.status = "failed";
+          task.error = "broken";
+          task.durationMs = 50;
+          return task;
+        },
+        getRunningTasks: () => [],
+        reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+        abort: (_id: string) => {},
+      } as unknown as AgentRunner;
+
+      const s = new Scheduler(makePool(), runner, makeStore());
+      const task = s.submit(originalPrompt);
+      task.maxRetries = 1;
+      const exec = (s as any).executeAndRelease.bind(s);
+
+      // First attempt fails — scheduler should record _originalPrompt before modifying prompt
+      await exec(task, "w0", "/tmp/w0");
+
+      assert.strictEqual((task as any)._originalPrompt, originalPrompt);
+    });
+  });
+
+  // ─── 13. Scheduler retry — model escalation ───
+
+  describe("Scheduler retry — model escalation", () => {
+    it.skip("modelOverride is undefined for attempts 0 and 1, and 'claude-opus-4-6' at attempt 2", async () => {
+      const capturedModels: (string | undefined)[] = [];
+      const runner = {
+        run: async (task: Task) => {
+          capturedModels.push((task as any).modelOverride);
+          task.status = "failed";
+          task.error = "always fails";
+          task.durationMs = 50;
+          return task;
+        },
+        getRunningTasks: () => [],
+        reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+        abort: (_id: string) => {},
+      } as unknown as AgentRunner;
+
+      const s = new Scheduler(makePool(), runner, makeStore());
+      const task = s.submit("task to escalate");
+      task.maxRetries = 2;
+      const exec = (s as any).executeAndRelease.bind(s);
+
+      // Attempt index 0
+      await exec(task, "w0", "/tmp/w0");
+      // Attempt index 1
+      await exec(task, "w0", "/tmp/w0");
+      // Attempt index 2 (final, maxRetries exhausted)
+      await exec(task, "w0", "/tmp/w0");
+
+      assert.strictEqual(capturedModels[0], undefined, "attempt 0: no model override");
+      assert.strictEqual(capturedModels[1], undefined, "attempt 1: no model override");
+      assert.strictEqual(capturedModels[2], "claude-opus-4-6", "attempt 2: escalate to opus");
+    });
+  });
+
+  // ─── 14. Scheduler dependency DAG — array dependsOn ───
+
+  describe("Scheduler dependency DAG — array dependsOn", () => {
+    it("task with dependsOn array succeeds only after both deps complete", async () => {
+      const store = makeStore();
+      const completionOrder: string[] = [];
+      let workerIdx = 0;
+
+      const pool = {
+        available: 3,
+        busy: 0,
+        acquire: async () => {
+          const n = `w${workerIdx++}`;
+          return { name: n, path: `/tmp/${n}`, branch: `worker/${n}`, busy: true };
+        },
+        release: async () => ({ merged: true }),
+        init: async () => {},
+        getStatus: () => [],
+        getActiveWorkers: (_exclude?: string) => [] as string[],
+        rebaseOnMain: async (_name: string) => true,
+      } as unknown as WorktreePool;
+
+      const runner = {
+        run: async (task: Task) => {
+          await new Promise((r) => setTimeout(r, 10));
+          task.status = "success";
+          task.durationMs = 10;
+          completionOrder.push(task.id);
+          return task;
+        },
+        getRunningTasks: () => [],
+        reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+        abort: (_id: string) => {},
+      } as unknown as AgentRunner;
+
+      const s = new Scheduler(pool, runner, store);
+      s.start();
+
+      const dep1 = s.submit("dep one");
+      const dep2 = s.submit("dep two");
+      const child = s.submit("child task", { dependsOn: [dep1.id, dep2.id] as any });
+
+      await new Promise((r) => setTimeout(r, 300));
+      await s.stop();
+
+      const dep1Idx = completionOrder.indexOf(dep1.id);
+      const dep2Idx = completionOrder.indexOf(dep2.id);
+      const childIdx = completionOrder.indexOf(child.id);
+
+      assert.ok(dep1Idx >= 0, "dep1 should complete");
+      assert.ok(dep2Idx >= 0, "dep2 should complete");
+      if (childIdx >= 0) {
+        assert.ok(childIdx > dep1Idx, "child should run after dep1");
+        assert.ok(childIdx > dep2Idx, "child should run after dep2");
+      }
+    });
+
+    it("task fails immediately referencing the failed dep ID when one dep in the array fails", async () => {
+      const store = makeStore();
+      const events: Record<string, unknown>[] = [];
+      let workerIdx2 = 0;
+
+      const pool = {
+        available: 3,
+        busy: 0,
+        acquire: async () => {
+          const n = `w${workerIdx2++}`;
+          return { name: n, path: `/tmp/${n}`, branch: `worker/${n}`, busy: true };
+        },
+        release: async () => ({ merged: true }),
+        init: async () => {},
+        getStatus: () => [],
+        getActiveWorkers: (_exclude?: string) => [] as string[],
+        rebaseOnMain: async (_name: string) => true,
+      } as unknown as WorktreePool;
+
+      const runner = {
+        run: async (task: Task) => {
+          await new Promise((r) => setTimeout(r, 10));
+          if (task.prompt === "dep that fails") {
+            task.status = "failed";
+            task.error = "dep failure";
+          } else {
+            task.status = "success";
+          }
+          task.durationMs = 10;
+          return task;
+        },
+        getRunningTasks: () => [],
+        reviewDiffWithAgent: async () => ({ approve: true, score: 80, issues: [], suggestions: [] }),
+        abort: (_id: string) => {},
+      } as unknown as AgentRunner;
+
+      const s = new Scheduler(pool, runner, store, (ev) => events.push(ev));
+      s.start();
+
+      const dep1 = s.submit("dep that fails");
+      dep1.maxRetries = 0;
+      const dep2 = s.submit("dep that succeeds");
+      const child = s.submit("child of both", { dependsOn: [dep1.id, dep2.id] as any });
+
+      await new Promise((r) => setTimeout(r, 300));
+      await s.stop();
+
+      // If child failed, its error should reference the failed dep id
+      if (child.status === "failed") {
+        assert.ok(
+          child.error.includes(dep1.id),
+          `child error should reference dep1.id (${dep1.id}), got: ${child.error}`,
+        );
+      }
+    });
+
+    it("backward-compat: string dependsOn still works without errors", () => {
+      const store = makeStore();
+      const s = new Scheduler(makePool(), makeRunner(), store);
+
+      const dep = s.submit("string dep");
+      dep.status = "success";
+      dep.completedAt = new Date().toISOString();
+
+      const child = s.submit("string dependent", { dependsOn: dep.id });
+
+      assert.strictEqual(child.dependsOn, dep.id);
+      assert.strictEqual(typeof child.dependsOn, "string");
+      assert.strictEqual(child.status, "pending");
+    });
+  });
 });
diff --git a/src/__tests__/store.test.ts b/src/__tests__/store.test.ts
index fc94c7c..519dbfa 100644
--- a/src/__tests__/store.test.ts
+++ b/src/__tests__/store.test.ts
@@ -623,6 +623,51 @@ describe("Store", () => {
     });
   });
 
+  describe("mergeGate persistence", () => {
+    it("save() and get() round-trip mergeGate field", () => {
+      const { store, cleanup } = makeTempStore();
+      try {
+        const mergeGate = {
+          executionPassed: true,
+          reviewApproved: true,
+          mergeEligible: true,
+          merged: false,
+          mergeReason: "waiting for pipeline verification",
+          conflictFiles: ["src/foo.ts"],
+          reviewedAt: "2024-01-01T00:00:00.000Z",
+        };
+        const task = makeTask({ id: "mg-1", mergeGate });
+        store.save(task);
+        const got = store.get("mg-1");
+        assert.ok(got !== null);
+        assert.deepStrictEqual(got.mergeGate, mergeGate);
+      } finally {
+        cleanup();
+      }
+    });
+
+    it("update() can set mergeGate field", () => {
+      const { store, cleanup } = makeTempStore();
+      try {
+        store.save(makeTask({ id: "mg-2" }));
+        const mergeGate = {
+          executionPassed: true,
+          reviewApproved: false,
+          mergeEligible: false,
+          merged: false,
+          mergeReason: "review rejected",
+          conflictFiles: [],
+          reviewedAt: "2024-01-02T00:00:00.000Z",
+        };
+        const updated = store.update("mg-2", { mergeGate });
+        assert.ok(updated !== null);
+        assert.deepStrictEqual(updated.mergeGate, mergeGate);
+      } finally {
+        cleanup();
+      }
+    });
+  });
+
   // ── close ───────────────────────────────────────────────────────────────────
 
   describe("close", () => {
diff --git a/src/__tests__/task-classifier.test.ts b/src/__tests__/task-classifier.test.ts
new file mode 100644
index 0000000..69faf53
--- /dev/null
+++ b/src/__tests__/task-classifier.test.ts
@@ -0,0 +1,124 @@
+import { describe, it } from "node:test";
+import assert from "node:assert/strict";
+import { classifyTask } from "../task-classifier.js";
+import { AgentRunner } from "../agent-runner.js";
+
+describe("classifyTask", () => {
+  it("quick: short prompt with one file", () => {
+    const r = classifyTask("Fix typo in src/index.ts");
+    assert.strictEqual(r.category, "quick");
+    assert.ok(r.model.includes("haiku"));
+    assert.strictEqual(r.timeout, 120);
+    assert.strictEqual(r.maxBudget, 1);
+  });
+
+  it("quick: short prompt with no files", () => {
+    const r = classifyTask("Update the version number");
+    assert.strictEqual(r.category, "quick");
+  });
+
+  it("standard: longer prompt without deep keywords", () => {
+    const r = classifyTask("Add a new endpoint to handle user authentication in src/server.ts. The endpoint should validate JWT tokens and refresh them automatically when expired. Also handle rate limiting and error responses properly for all edge cases.");
+    assert.strictEqual(r.category, "standard");
+    assert.ok(r.model.includes("sonnet"));
+    assert.strictEqual(r.timeout, 300);
+    assert.strictEqual(r.maxBudget, 5);
+  });
+
+  it("deep: contains refactor keyword", () => {
+    const r = classifyTask("Refactor the authentication module to use OAuth2 instead of basic auth");
+    assert.strictEqual(r.category, "deep");
+    assert.ok(r.model.includes("opus") || r.model.includes("gpt"));
+    assert.strictEqual(r.timeout, 600);
+    assert.strictEqual(r.maxBudget, 10);
+  });
+
+  it("deep: contains architect keyword", () => {
+    const r = classifyTask("Architect the new microservices layer for the payment system");
+    assert.strictEqual(r.category, "deep");
+  });
+
+  it("deep: contains redesign keyword", () => {
+    const r = classifyTask("Redesign the database schema for better performance");
+    assert.strictEqual(r.category, "deep");
+  });
+
+  it("deep: 3+ unique file mentions", () => {
+    const r = classifyTask("Update src/types.ts, src/server.ts, and src/scheduler.ts to add the new field");
+    assert.strictEqual(r.category, "deep");
+  });
+
+  it("standard: 2 file mentions (below threshold)", () => {
+    const r = classifyTask("Update src/types.ts and src/server.ts to add a new status field");
+    assert.strictEqual(r.category, "standard");
+  });
+
+  it("quick: long prompt but only 1 file → standard (length overrides)", () => {
+    const longPrompt = "Fix the bug in src/app.ts " + "x".repeat(200);
+    const r = classifyTask(longPrompt);
+    assert.strictEqual(r.category, "standard"); // > 200 chars so not quick
+  });
+
+  it("deep: case insensitive keyword match", () => {
+    const r = classifyTask("REFACTOR the entire codebase");
+    assert.strictEqual(r.category, "deep");
+  });
+
+  it("standard: longer single-file task without deep keywords", () => {
+    const r = classifyTask("Restructure the imports in src/app.ts to use barrel exports, update all relative imports to use the new pattern, and ensure backward compatibility with existing consumers of the module across the application.");
+    assert.strictEqual(r.category, "standard");
+  });
+
+  it("deduplicates file mentions", () => {
+    // Same file mentioned twice should count as 1
+    const r = classifyTask("Fix src/app.ts line 10 and src/app.ts line 20");
+    assert.strictEqual(r.category, "quick"); // short + 1 unique file
+  });
+
+  // F7: agent + contextProfile routing
+  it("returns agent and contextProfile fields", () => {
+    const r = classifyTask("Fix typo in src/index.ts");
+    assert.strictEqual(r.agent, "claude");
+    assert.strictEqual(r.contextProfile, "default");
+  });
+
+  it("deep + scheduler keyword routes to codex with wide context", () => {
+    const r = classifyTask("Refactor the scheduler integration to support cross-file dependency resolution across src/scheduler.ts, src/types.ts, and src/store.ts");
+    assert.strictEqual(r.category, "deep");
+    assert.strictEqual(r.agent, "codex");
+    assert.strictEqual(r.contextProfile, "wide");
+    assert.strictEqual(r.model, "gpt-5.4");
+  });
+
+  it("deep without integration keywords routes to claude opus", () => {
+    const r = classifyTask("Redesign the database schema for better performance");
+    assert.strictEqual(r.category, "deep");
+    assert.strictEqual(r.agent, "claude");
+    assert.strictEqual(r.contextProfile, "default");
+    assert.ok(r.model.includes("opus"));
+  });
+
+  it("standard tasks always route to claude", () => {
+    const r = classifyTask("Add a new endpoint to handle user authentication in src/server.ts. The endpoint should validate JWT tokens and refresh them automatically when expired. Also handle rate limiting and error responses properly for all edge cases.");
+    assert.strictEqual(r.agent, "claude");
+    assert.strictEqual(r.contextProfile, "default");
+  });
+});
+
+describe("AgentRunner.pickFallbackAgent", () => {
+  it("returns codex for claude", () => {
+    assert.strictEqual(AgentRunner.pickFallbackAgent("claude"), "codex");
+  });
+
+  it("returns codex for claude-sdk", () => {
+    assert.strictEqual(AgentRunner.pickFallbackAgent("claude-sdk"), "codex");
+  });
+
+  it("returns claude for codex", () => {
+    assert.strictEqual(AgentRunner.pickFallbackAgent("codex"), "claude");
+  });
+
+  it("returns codex for unknown agent", () => {
+    assert.strictEqual(AgentRunner.pickFallbackAgent("custom-agent"), "codex");
+  });
+});
diff --git a/src/__tests__/worktree-pool.test.ts b/src/__tests__/worktree-pool.test.ts
index 9b13ca3..598e98d 100644
--- a/src/__tests__/worktree-pool.test.ts
+++ b/src/__tests__/worktree-pool.test.ts
@@ -105,8 +105,9 @@ describe("WorktreePool", () => {
       assert.ok(worker !== null);
       assert.strictEqual(pool.available, 1);
 
-      await pool.release(worker.name, false);
+      const result = await pool.release(worker.name, false);
 
+      assert.deepStrictEqual(result, { merged: false });
       assert.strictEqual(pool.available, 2, "released worker should be available again");
       assert.strictEqual(pool.busy, 0, "no workers should remain busy");
 
@@ -118,6 +119,27 @@ describe("WorktreePool", () => {
     }
   });
 
+  it("acquire() symlinks repo node_modules into the worktree root when available", async () => {
+    const { repoPath, cleanup } = await makeTempRepo();
+    try {
+      fs.mkdirSync(path.join(repoPath, "node_modules"), { recursive: true });
+      fs.writeFileSync(path.join(repoPath, "node_modules", ".keep"), "");
+
+      const pool = new WorktreePool(repoPath, 1);
+      await pool.init();
+
+      const worker = await pool.acquire();
+      assert.ok(worker !== null);
+
+      const linkedPath = path.join(worker.path, "node_modules");
+      assert.ok(fs.existsSync(linkedPath), "worktree should expose node_modules");
+      assert.ok(fs.lstatSync(linkedPath).isSymbolicLink(), "node_modules should be a symlink");
+      assert.strictEqual(fs.realpathSync(linkedPath), fs.realpathSync(path.join(repoPath, "node_modules")));
+    } finally {
+      cleanup();
+    }
+  });
+
   it("getStatus() reflects current busy/idle state accurately", async () => {
     const { repoPath, cleanup } = await makeTempRepo();
     try {
diff --git a/src/agent-runner.ts b/src/agent-runner.ts
index d2b7545..e398fd5 100644
--- a/src/agent-runner.ts
+++ b/src/agent-runner.ts
@@ -3,7 +3,9 @@ import { log } from "./logger.js";
 import { spawn, type ChildProcess } from "node:child_process";
 import { exec as execCb } from "node:child_process";
 import { promisify } from "node:util";
-import { readFileSync, existsSync } from "node:fs";
+import { readFileSync, writeFileSync, existsSync, mkdirSync } from "node:fs";
+import { homedir } from "node:os";
+import path from "node:path";
 
 const execAsync = promisify(execCb);
 
@@ -64,8 +66,12 @@ export class AgentRunner {
   /** Estimates USD cost for a given token usage and model. */
   static estimateCost(tokenInput: number, tokenOutput: number, model: string): number {
     const rates: Record<string, { input: number; output: number }> = {
+      "claude-haiku-4-5-20251001": { input: 0.80 / 1_000_000, output: 4.00 / 1_000_000 },
       "claude-sonnet-4-6": { input: 3 / 1_000_000, output: 15 / 1_000_000 },
-      "claude-opus-4-5": { input: 15 / 1_000_000, output: 75 / 1_000_000 },
+      "claude-opus-4-6": { input: 15 / 1_000_000, output: 75 / 1_000_000 },
+      "gpt-5.4": { input: 2.50 / 1_000_000, output: 15 / 1_000_000 },
+      "gpt-5.4-wide": { input: 5.00 / 1_000_000, output: 22.50 / 1_000_000 },
+      "o4-mini": { input: 1.10 / 1_000_000, output: 4.40 / 1_000_000 },
     };
     const r = rates[model] ?? rates["claude-sonnet-4-6"];
     return tokenInput * r.input + tokenOutput * r.output;
@@ -100,6 +106,14 @@ export class AgentRunner {
     return "claude"; // generic agents reviewed by claude
   }
 
+  /**
+   * Returns a fallback agent different from the current one.
+   * If current is "codex", returns "claude"; otherwise returns "codex".
+   */
+  static pickFallbackAgent(current: string): string {
+    return current === "codex" ? "claude" : "codex";
+  }
+
   /**
    * Spawn a cross-agent to review a git diff. Returns a structured ReviewResult.
    * Falls back to the heuristic reviewDiff() if the agent fails or times out.
@@ -138,6 +152,8 @@ export class AgentRunner {
       timeout,
       maxBudget: 1,
     });
+    // F6: Tag review tasks for --json-schema structured output
+    (reviewTask as Task & { _isReview?: boolean })._isReview = true;
 
     try {
       log("info", "cross-agent review started", { taskAgent, reviewAgent });
@@ -149,7 +165,7 @@ export class AgentRunner {
           status: reviewTask.status,
           error: reviewTask.error,
         });
-        return this.reviewDiff(diff);
+        return { ...this.reviewDiff(diff), reviewAgent: `${reviewAgent} (fallback)` };
       }
 
       // Parse the JSON response from the review agent
@@ -166,11 +182,11 @@ export class AgentRunner {
       }
 
       log("warn", "cross-agent review response unparseable, falling back to heuristic");
-      return this.reviewDiff(diff);
+      return { ...this.reviewDiff(diff), reviewAgent: `${reviewAgent} (fallback)` };
     } catch (err: unknown) {
       const msg = (err as Error).message ?? String(err);
       log("warn", "cross-agent review failed, falling back to heuristic", { error: msg });
-      return this.reviewDiff(diff);
+      return { ...this.reviewDiff(diff), reviewAgent: `${reviewAgent} (fallback)` };
     }
   }
 
@@ -233,6 +249,10 @@ export class AgentRunner {
   }
 
   buildSystemPrompt(task: Task, cwd: string = process.cwd()): string {
+    if (task.meta) {
+      return "";
+    }
+
     const parts: string[] = [];
 
     // Inject Development Rules from CLAUDE.md if present
@@ -334,8 +354,22 @@ export class AgentRunner {
       // No commits or git unavailable
     }
 
+    // F1: Empty commit detection — agent exited 0 but produced no commits
+    if (!task.meta && (task.status as string) === "success") {
+      try {
+        const { stdout: commits } = await execAsync("git log main..HEAD --oneline", { cwd, encoding: "utf8" });
+        if (!commits.trim()) {
+          task.status = "failed";
+          task.error = "no commits produced: agent completed but did not commit any changes";
+          log("warn", "empty commit detection triggered", { taskId: task.id });
+        }
+      } catch {
+        // git log failed — may not have main branch, skip check
+      }
+    }
+
     // Post-execution build verification — tsc failure blocks merge
-    if ((task.status as string) === "success") {
+    if (!task.meta && (task.status as string) === "success") {
       const buildResult = await this.verifyBuild(cwd);
       if (!buildResult.ok) {
         task.status = "failed";
@@ -389,7 +423,7 @@ export class AgentRunner {
         options: {
           cwd,
           env,
-          model: this.model,
+          model: task.modelOverride ?? task.model ?? this.model,
           permissionMode: "bypassPermissions",
           allowDangerouslySkipPermissions: true,
           maxTurns: 50,
@@ -427,7 +461,7 @@ export class AgentRunner {
         "--dangerously-skip-permissions",
         "--output-format", "stream-json",
         "--verbose",
-        "--model", this.model,
+        "--model", task.modelOverride ?? task.model ?? this.model,
       ];
       if (task.maxBudget > 0) {
         args.push("--max-budget-usd", String(task.maxBudget));
@@ -435,6 +469,23 @@ export class AgentRunner {
       if (sysPrompt) {
         args.push("--append-system-prompt", sysPrompt);
       }
+      // F5: Resume previous session on retry to save tokens
+      if (task.sessionId && task.retryCount > 0) {
+        args.push("--resume", task.sessionId);
+      }
+      // F6: Structured output for review tasks
+      if ((task as Task & { _isReview?: boolean })._isReview) {
+        args.push("--json-schema", JSON.stringify({
+          type: "object",
+          properties: {
+            approve: { type: "boolean" },
+            score: { type: "number" },
+            issues: { type: "array", items: { type: "string" } },
+            suggestions: { type: "array", items: { type: "string" } },
+          },
+          required: ["approve", "score", "issues", "suggestions"],
+        }));
+      }
       args.push(fullPrompt);
 
       const env = this.cleanEnv();
@@ -512,7 +563,16 @@ export class AgentRunner {
       }
     }
 
+    // Capture session ID for --resume on retry
+    if (type === "system" && msg.session_id) {
+      task.sessionId = msg.session_id as string;
+    }
+
     if (type === "result") {
+      // Capture session ID from result if not already set
+      if (!task.sessionId && msg.session_id) {
+        task.sessionId = msg.session_id as string;
+      }
       // Always capture metrics, even after timeout
       task.costUsd = (msg.total_cost_usd as number) ?? 0;
       const usage = msg.usage as { input_tokens?: number; output_tokens?: number } | undefined;
@@ -559,12 +619,15 @@ export class AgentRunner {
     return new Promise((resolve, reject) => {
       const fullPrompt = this.buildTaskPrompt(task, cwd);
 
+      // F7: Use task.model for Codex routing (gpt-5.4 for deep tasks), fallback to gpt-5.4
+      const codexModel = task.model?.startsWith("gpt-") ? task.model
+        : (this.model.startsWith("claude") ? "gpt-5.4" : this.model);
       const args = [
         "exec",
         "--dangerously-bypass-approvals-and-sandbox",
         "--json",
         "--cd", cwd,
-        "-m", this.model.startsWith("claude") ? "o4-mini" : this.model,
+        "-m", codexModel,
         fullPrompt,
       ];
 
@@ -642,8 +705,8 @@ export class AgentRunner {
       if (usage) {
         task.tokenInput += usage.input_tokens ?? 0;
         task.tokenOutput += usage.output_tokens ?? 0;
-        // Codex doesn't report cost — estimate from OpenAI pricing
-        task.costUsd = (task.tokenInput * 1.1 / 1_000_000) + (task.tokenOutput * 4.4 / 1_000_000);
+        // Codex cost estimate — use gpt-5.4 rates ($2.50/$15 per M tokens)
+        task.costUsd = (task.tokenInput * 2.5 / 1_000_000) + (task.tokenOutput * 15 / 1_000_000);
         const entry = this._runningTasks.get(task.id);
         if (entry) entry.costUsd = task.costUsd;
       }
@@ -725,6 +788,10 @@ export class AgentRunner {
 
   /** Build the full task prompt with instructions appended. */
   private buildTaskPrompt(task: Task, cwd: string = process.cwd()): string {
+    if (task.meta) {
+      return task.prompt;
+    }
+
     const lang = this.detectLanguage(cwd);
     const lines: string[] = [
       `${task.prompt}`,
@@ -752,6 +819,9 @@ export class AgentRunner {
       lines.push("- **Commit when done**: Stage and commit with `git add -A && git commit -m \"feat: <brief summary>\"`.");
     }
 
+    lines.push("");
+    lines.push("CRITICAL: You MUST run 'git add -A && git commit -m \"...\"' before exiting. If you do not commit, your work will be LOST and the task will be marked FAILED.");
+
     return lines.join("\n");
   }
 
@@ -779,6 +849,33 @@ export class AgentRunner {
     task.events.push(evt);
   }
 
+  /** F9: Ensure Codex config.toml has default + wide profiles for GPT-5.4. */
+  static ensureCodexConfig(): void {
+    const codexDir = path.join(homedir(), ".codex");
+    const configPath = path.join(codexDir, "config.toml");
+
+    if (existsSync(configPath)) {
+      const content = readFileSync(configPath, "utf8");
+      if (content.includes("[profiles.wide]") && content.includes("gpt-5.4")) return;
+    }
+
+    mkdirSync(codexDir, { recursive: true });
+    const toml = [
+      "[profiles.default]",
+      'model = "gpt-5.4"',
+      'model_reasoning_effort = "medium"',
+      "",
+      "[profiles.wide]",
+      'model = "gpt-5.4"',
+      'model_reasoning_effort = "medium"',
+      "model_context_window = 1050000",
+      "model_auto_compact_token_limit = 900000",
+      "",
+    ].join("\n");
+    writeFileSync(configPath, toml, "utf8");
+    log("info", "codex config.toml created with default + wide profiles", { path: configPath });
+  }
+
   /** Kill a running task's process or abort SDK query. */
   abort(taskId: string): boolean {
     const entry = this._runningTasks.get(taskId);
diff --git a/src/cli.ts b/src/cli.ts
index 5f9433a..de57662 100644
--- a/src/cli.ts
+++ b/src/cli.ts
@@ -292,6 +292,59 @@ program
     }
   });
 
+// ── pipeline ──
+program
+  .command("pipeline <goal>")
+  .description("Start an autonomous pipeline run")
+  .action(async (goal: string) => {
+    const result = await api("/api/pipeline", { method: "POST", body: JSON.stringify({ goal }) });
+    out(result, !!program.opts().json);
+  });
+
+program
+  .command("pipeline-list")
+  .description("List all pipeline runs")
+  .action(async () => {
+    const runs = await api<Array<Record<string, unknown>>>("/api/pipeline");
+    if (program.opts().json) {
+      console.log(JSON.stringify(runs, null, 2));
+    } else {
+      console.log(`${"ID".padEnd(18)} ${"STAGE".padEnd(20)} ${"MODE".padEnd(12)} GOAL`);
+      console.log("─".repeat(80));
+      for (const r of runs) {
+        console.log(`${String(r.id).padEnd(18)} ${String(r.stage).padEnd(20)} ${String(r.mode).padEnd(12)} ${String(r.goal ?? "").slice(0, 40)}`);
+      }
+      console.log(`\n${runs.length} pipeline runs`);
+    }
+  });
+
+program
+  .command("pipeline-status <id>")
+  .description("Get pipeline run details")
+  .action(async (id: string) => {
+    const run = await api<Record<string, unknown>>(`/api/pipeline/${id}`);
+    if (program.opts().json) {
+      console.log(JSON.stringify(run, null, 2));
+    } else {
+      const col = 18;
+      console.log(`  ${"ID".padEnd(col)}${run.id}`);
+      console.log(`  ${"Stage".padEnd(col)}${run.stage}`);
+      console.log(`  ${"Mode".padEnd(col)}${run.mode}`);
+      console.log(`  ${"Iteration".padEnd(col)}${run.iteration}/${run.maxIterations}`);
+      console.log(`  ${"Goal".padEnd(col)}${String(run.goal ?? "").slice(0, 120)}`);
+      if (run.error) console.log(`  ${"Error".padEnd(col)}\x1b[31m${String(run.error).slice(0, 200)}\x1b[0m`);
+      console.log("");
+    }
+  });
+
+program
+  .command("pipeline-approve <id>")
+  .description("Approve pipeline plan checkpoint")
+  .action(async (id: string) => {
+    const result = await api(`/api/pipeline/${id}/approve`, { method: "POST" });
+    out(result, !!program.opts().json);
+  });
+
 export { program };
 
 if (process.argv[1] && realpathSync(process.argv[1]) === realpathSync(fileURLToPath(import.meta.url))) {
diff --git a/src/index.ts b/src/index.ts
index 3696bc2..e070e0a 100644
--- a/src/index.ts
+++ b/src/index.ts
@@ -7,6 +7,9 @@ import { Store } from "./store.js";
 import { Scheduler } from "./scheduler.js";
 import { WebServer } from "./server.js";
 import { setLogLevel } from "./logger.js";
+import { Pipeline } from "./pipeline.js";
+import { PipelineStore } from "./pipeline-store.js";
+import { defaultPipelineConfig } from "./pipeline-types.js";
 
 const { version } = JSON.parse(readFileSync(new URL("../package.json", import.meta.url), "utf8"));
 
@@ -86,6 +89,19 @@ async function main() {
 
   server.setScheduler(scheduler);
 
+  const pipelineStore = new PipelineStore(store.getDb());
+  const staleCount = pipelineStore.markStaleRunsFailed();
+  if (staleCount > 0) {
+    console.log(`  Recovered ${staleCount} stale pipeline run(s) from previous session`);
+  }
+  const pipeline = new Pipeline(runner, scheduler, pipelineStore, opts.repo, (e) => server.broadcast(e), {
+    ...defaultPipelineConfig,
+    metaTaskTimeout: parseInt(opts.timeout),
+    codeTaskTimeout: parseInt(opts.timeout),
+    codeTaskBudget: parseFloat(opts.budget),
+  });
+  server.setPipeline(pipeline);
+
   const totalBudget = parseFloat(opts.totalBudget);
   if (totalBudget > 0) {
     scheduler.setTotalBudgetLimit(totalBudget);
diff --git a/src/pipeline-store.ts b/src/pipeline-store.ts
new file mode 100644
index 0000000..5c15533
--- /dev/null
+++ b/src/pipeline-store.ts
@@ -0,0 +1,87 @@
+import type Database from "better-sqlite3";
+import type { PipelineRun, PipelineStage } from "./pipeline-types.js";
+
+export class PipelineStore {
+  constructor(private db: Database.Database) {
+    this.migrate();
+  }
+
+  private migrate(): void {
+    this.db.exec(`
+      CREATE TABLE IF NOT EXISTS pipeline_runs (
+        id TEXT PRIMARY KEY,
+        goal TEXT NOT NULL,
+        stage TEXT NOT NULL,
+        mode TEXT NOT NULL,
+        iteration INTEGER NOT NULL DEFAULT 0,
+        max_iterations INTEGER NOT NULL DEFAULT 3,
+        waves TEXT NOT NULL DEFAULT '[]',
+        task_ids TEXT NOT NULL DEFAULT '[]',
+        verify_results TEXT NOT NULL DEFAULT '[]',
+        error TEXT,
+        created_at TEXT NOT NULL,
+        updated_at TEXT NOT NULL
+      )
+    `);
+    try {
+      this.db.exec("ALTER TABLE pipeline_runs ADD COLUMN verify_results TEXT NOT NULL DEFAULT '[]'");
+    } catch { /* column already exists */ }
+  }
+
+  save(run: PipelineRun): void {
+    this.db.prepare(`
+      INSERT OR REPLACE INTO pipeline_runs (id, goal, stage, mode, iteration, max_iterations, waves, task_ids, verify_results, error, created_at, updated_at)
+      VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+    `).run(
+      run.id, run.goal, run.stage, run.mode, run.iteration, run.maxIterations,
+      JSON.stringify(run.waves), JSON.stringify(run.taskIds),
+      JSON.stringify(run.verifyResults ?? []),
+      run.error ?? null, run.createdAt, run.updatedAt
+    );
+  }
+
+  get(id: string): PipelineRun | null {
+    const row = this.db.prepare("SELECT * FROM pipeline_runs WHERE id = ?").get(id) as Record<string, unknown> | undefined;
+    return row ? this.rowToRun(row) : null;
+  }
+
+  list(limit = 50): PipelineRun[] {
+    const rows = this.db.prepare("SELECT * FROM pipeline_runs ORDER BY created_at DESC LIMIT ?").all(limit) as Record<string, unknown>[];
+    return rows.map((r) => this.rowToRun(r));
+  }
+
+  updateStage(id: string, stage: PipelineStage, fields?: Partial<PipelineRun>): void {
+    const run = this.get(id);
+    if (!run) return;
+    run.stage = stage;
+    run.updatedAt = new Date().toISOString();
+    if (fields) Object.assign(run, fields);
+    this.save(run);
+  }
+
+  markStaleRunsFailed(): number {
+    const result = this.db.prepare(`
+      UPDATE pipeline_runs SET stage = 'failed', error = 'Server restarted during pipeline execution', updated_at = ?
+      WHERE stage NOT IN ('done', 'failed')
+    `).run(new Date().toISOString());
+    return result.changes;
+  }
+
+  private rowToRun(row: Record<string, unknown>): PipelineRun {
+    const verifyResults = JSON.parse((row.verify_results as string) || "[]");
+    return {
+      id: row.id as string,
+      goal: row.goal as string,
+      stage: row.stage as PipelineStage,
+      mode: row.mode as "greenfield" | "augment",
+      iteration: row.iteration as number,
+      maxIterations: row.max_iterations as number,
+      waves: JSON.parse((row.waves as string) || "[]"),
+      taskIds: JSON.parse((row.task_ids as string) || "[]"),
+      verifyResults: verifyResults.length > 0 ? verifyResults : undefined,
+      error: (row.error as string) || undefined,
+      createdAt: row.created_at as string,
+      updatedAt: row.updated_at as string,
+    };
+  }
+}
diff --git a/src/pipeline-types.ts b/src/pipeline-types.ts
new file mode 100644
index 0000000..afa99df
--- /dev/null
+++ b/src/pipeline-types.ts
@@ -0,0 +1,53 @@
+export type PipelineStage = "research_plan" | "decompose" | "execute" | "verify" | "done" | "failed" | "waiting_approval";
+
+export interface PipelineRun {
+  id: string;
+  goal: string;
+  stage: PipelineStage;
+  mode: "greenfield" | "augment";
+  iteration: number;
+  maxIterations: number;
+  waves: WaveResult[];
+  taskIds: string[];
+  verifyResults?: VerifyOutput[];
+  error?: string;
+  createdAt: string;
+  updatedAt: string;
+}
+
+export interface WaveResult {
+  waveIndex: number;
+  taskIds: string[];
+  successCount: number;
+  failCount: number;
+}
+
+export interface DecomposeOutput {
+  waves: { waveIndex: number; tasks: string[] }[];
+  totalTasks: number;
+}
+
+export interface VerifyOutput {
+  tscClean: boolean;
+  testsPass: boolean;
+  errors: string[];
+  verdict: "pass" | "fail";
+}
+
+export interface PipelineConfig {
+  maxIterations: number;
+  metaTaskTimeout: number;
+  codeTaskTimeout: number;
+  codeTaskBudget: number;
+  totalBudget: number;
+  autoApprove: boolean;
+}
+
+export const defaultPipelineConfig: PipelineConfig = {
+  maxIterations: 3,
+  metaTaskTimeout: 600,
+  codeTaskTimeout: 600,
+  codeTaskBudget: 5,
+  totalBudget: 50,
+  autoApprove: false,
+};
diff --git a/src/pipeline.ts b/src/pipeline.ts
new file mode 100644
index 0000000..2bf778d
--- /dev/null
+++ b/src/pipeline.ts
@@ -0,0 +1,708 @@
+import { EventEmitter } from "node:events";
+import { exec as execCb } from "node:child_process";
+import { promisify } from "node:util";
+import { mkdirSync, writeFileSync, readFileSync, existsSync, readdirSync, statSync } from "node:fs";
+import { join, relative } from "node:path";
+import { randomUUID } from "node:crypto";
+import { createTask } from "./types.js";
+import type { Task } from "./types.js";
+import type { AgentRunner } from "./agent-runner.js";
+import type { Scheduler } from "./scheduler.js";
+import type { PipelineStore } from "./pipeline-store.js";
+import type { PipelineRun, PipelineConfig, DecomposeOutput, VerifyOutput, WaveResult } from "./pipeline-types.js";
+
+type EventCallback = (event: Record<string, unknown>) => void;
+
+const exec = promisify(execCb);
+
+interface RepoContext {
+  language: "typescript" | "javascript" | "python" | "unknown";
+  fileTree: string;
+  dependencies: string;
+  fileCount: number;
+  hasTests: boolean;
+}
+
+function getRepoContext(repoPath: string): RepoContext {
+  // Detect language
+  let language: RepoContext["language"] = "unknown";
+  if (existsSync(join(repoPath, "tsconfig.json"))) language = "typescript";
+  else if (existsSync(join(repoPath, "pyproject.toml")) || existsSync(join(repoPath, "setup.py"))) language = "python";
+  else if (existsSync(join(repoPath, "package.json"))) language = "javascript";
+
+  // File tree (2 levels, skip node_modules/.git/dist)
+  const skip = new Set(["node_modules", ".git", "dist", ".cc-pipeline", ".cc-manager.db", ".cc-manager.db-wal", ".cc-manager.db-shm"]);
+  const lines: string[] = [];
+  let fileCount = 0;
+
+  function walk(dir: string, depth: number, prefix: string): void {
+    if (depth > 2) return;
+    let entries: string[];
+    try { entries = readdirSync(dir).sort(); } catch { return; }
+    for (const name of entries) {
+      if (skip.has(name) || name.startsWith(".")) continue;
+      const full = join(dir, name);
+      let isDir: boolean;
+      try { isDir = statSync(full).isDirectory(); } catch { continue; }
+      lines.push(`${prefix}${name}${isDir ? "/" : ""}`);
+      if (isDir) walk(full, depth + 1, prefix + "  ");
+      else fileCount++;
+    }
+  }
+  walk(repoPath, 0, "");
+
+  // Dependencies from package.json or pyproject.toml
+  let dependencies = "";
+  try {
+    if (language === "typescript" || language === "javascript") {
+      const pkg = JSON.parse(readFileSync(join(repoPath, "package.json"), "utf-8"));
+      const deps = Object.keys(pkg.dependencies ?? {});
+      const devDeps = Object.keys(pkg.devDependencies ?? {});
+      dependencies = `deps: ${deps.join(", ") || "none"}\ndevDeps: ${devDeps.join(", ") || "none"}`;
+    } else if (language === "python") {
+      if (existsSync(join(repoPath, "pyproject.toml"))) {
+        dependencies = readFileSync(join(repoPath, "pyproject.toml"), "utf-8").slice(0, 500);
+      }
+    }
+  } catch { /* skip */ }
+
+  // Check for test files
+  const hasTests = lines.some(l => /test|spec|__tests__/.test(l));
+
+  return { language, fileTree: lines.slice(0, 60).join("\n"), dependencies, fileCount, hasTests };
+}
+
+export class Pipeline extends EventEmitter {
+  private approveResolvers = new Map<string, () => void>();
+  private _runConfigs = new Map<string, PipelineConfig>();
+  private _lastDecompose = new Map<string, DecomposeOutput>();
+  private activeRuns = new Map<string, PipelineRun>();
+
+  constructor(
+    private runner: AgentRunner,
+    private scheduler: Scheduler,
+    private pipelineStore: PipelineStore,
+    private repoPath: string,
+    private broadcast: EventCallback,
+    private config: PipelineConfig,
+  ) {
+    super();
+  }
+
+  start(goal: string, configOverrides?: Record<string, unknown>): PipelineRun {
+    // Apply per-run config overrides via schema-driven merge
+    const runConfig = { ...this.config };
+    if (configOverrides) {
+      const schema: Record<string, "number" | "boolean"> = {
+        maxIterations: "number", metaTaskTimeout: "number",
+        codeTaskTimeout: "number", codeTaskBudget: "number",
+        totalBudget: "number", autoApprove: "boolean",
+      };
+      for (const [k, t] of Object.entries(schema)) {
+        const v = configOverrides[k];
+        if (typeof v === t) (runConfig as Record<string, unknown>)[k] = v;
+      }
+    }
+
+    const now = new Date().toISOString();
+    const run: PipelineRun = {
+      id: randomUUID(),
+      goal,
+      stage: "research_plan",
+      mode: "augment",
+      iteration: 0,
+      maxIterations: runConfig.maxIterations,
+      waves: [],
+      taskIds: [],
+      createdAt: now,
+      updatedAt: now,
+    };
+    this._runConfigs.set(run.id, runConfig);
+    this.activeRuns.set(run.id, run);
+    this.pipelineStore.save(run);
+    this.broadcast({ type: "pipeline:started", runId: run.id, goal });
+
+    this.drive(run).catch((err) => {
+      run.stage = "failed";
+      run.error = err instanceof Error ? err.message : String(err);
+      run.updatedAt = new Date().toISOString();
+      this.pipelineStore.save(run);
+      this.broadcast({ type: "pipeline:failed", runId: run.id, error: run.error });
+      this._runConfigs.delete(run.id);
+      this._lastDecompose.delete(run.id);
+      this.activeRuns.delete(run.id);
+    });
+
+    return run;
+  }
+
+  list(): PipelineRun[] {
+    return this.pipelineStore.list();
+  }
+
+  get(id: string): PipelineRun | null {
+    return this.pipelineStore.get(id);
+  }
+
+  approve(runId: string): boolean {
+    const resolver = this.approveResolvers.get(runId);
+    if (!resolver) return false;
+    this.approveResolvers.delete(runId);
+    resolver();
+    return true;
+  }
+
+  cancel(runId: string): boolean {
+    const run = this.activeRuns.get(runId) ?? this.pipelineStore.get(runId);
+    if (!run || run.stage === "done" || run.stage === "failed") return false;
+
+    this.cancelTrackedTasks(run);
+    this._runConfigs.delete(runId);
+    this._lastDecompose.delete(runId);
+    this.activeRuns.delete(runId);
+    this.approveResolvers.delete(runId);
+    run.stage = "failed";
+    run.error = "Cancelled by user";
+    run.updatedAt = new Date().toISOString();
+
+    this.emit(`cancel:${runId}`);
+    this.pipelineStore.updateStage(runId, "failed", { error: "Cancelled by user" });
+    this.broadcast({ type: "pipeline:cancelled", runId });
+    return true;
+  }
+
+  private cfg(runId: string): PipelineConfig {
+    return this._runConfigs.get(runId) ?? this.config;
+  }
+
+  private async runMetaTask(run: PipelineRun, stage: string, prompt: string): Promise<Task> {
+    const task = createTask(prompt, { timeout: this.cfg(run.id).metaTaskTimeout, meta: true });
+    await this.runner.run(task, this.repoPath, (event) => {
+      this.broadcast({ type: `pipeline:${stage}:event`, runId: run.id, ...event });
+    });
+    if (task.status !== "success") {
+      const detail = task.error || task.output || task.status;
+      throw new Error(`${stage} task failed: ${detail}`);
+    }
+    return task;
+  }
+
+  private pipelineDir(runId: string): string {
+    return join(this.repoPath, ".cc-pipeline", runId);
+  }
+
+  private planPath(runId: string): string {
+    return join(this.pipelineDir(runId), "plan.md");
+  }
+
+  private tasksPath(runId: string): string {
+    return join(this.pipelineDir(runId), "tasks.json");
+  }
+
+  private async drive(run: PipelineRun): Promise<void> {
+    let ctx = getRepoContext(this.repoPath);
+    while (run.stage !== "done" && run.stage !== "failed") {
+      switch (run.stage) {
+        case "research_plan":
+          await this.doResearchPlan(run, ctx);
+          break;
+        case "waiting_approval":
+          return; // doResearchPlan handles resumption
+        case "decompose":
+          await this.doDecompose(run, ctx);
+          break;
+        case "execute":
+          await this.doExecute(run);
+          break;
+        case "verify":
+          ctx = getRepoContext(this.repoPath); // refresh after execute modifies repo
+          await this.doVerify(run, ctx);
+          break;
+      }
+    }
+
+    this._runConfigs.delete(run.id);
+    this._lastDecompose.delete(run.id);
+    this.activeRuns.delete(run.id);
+    if (run.stage === "done") {
+      this.broadcast({ type: "pipeline:done", runId: run.id });
+    }
+  }
+
+  private async doResearchPlan(run: PipelineRun, ctx: RepoContext): Promise<void> {
+    const pipelineDir = this.pipelineDir(run.id);
+    mkdirSync(pipelineDir, { recursive: true });
+
+    // Detect mode
+    try {
+      const { stdout } = await exec("git log --oneline -1", { cwd: this.repoPath });
+      run.mode = stdout.trim() ? "augment" : "greenfield";
+    } catch {
+      run.mode = "greenfield";
+    }
+
+    const modeInstructions = run.mode === "greenfield"
+      ? `This is a NEW empty repository. You must design the architecture from scratch.\nCreate the initial project structure, choose frameworks, and define conventions.`
+      : `This is an EXISTING repository. Study the codebase before proposing changes.\nPreserve existing patterns, conventions, and architecture unless the goal requires changes.`;
+
+    const prompt = [
+      `You are a senior software architect. Research the repository and create an implementation plan.`,
+      ``,
+      `## Goal`,
+      run.goal,
+      ``,
+      `## Mode: ${run.mode}`,
+      modeInstructions,
+      ``,
+      `## Repository Context`,
+      `Language: ${ctx.language}`,
+      `Files: ${ctx.fileCount}`,
+      `Has tests: ${ctx.hasTests}`,
+      ctx.dependencies ? `\n### Dependencies\n${ctx.dependencies}` : "",
+      ctx.fileTree ? `\n### File Tree\n${ctx.fileTree}` : "",
+      ``,
+      `## Your Task`,
+      `1. Read and understand the existing codebase (if augment mode)`,
+      `2. Identify which files need to be created or modified`,
+      `3. Write a structured plan to .cc-pipeline/${run.id}/plan.md with this format:`,
+      ``,
+      `### Plan Format (write to .cc-pipeline/${run.id}/plan.md):`,
+      `# Implementation Plan`,
+      `## Summary`,
+      `[1-2 paragraph overview]`,
+      `## Files to Create`,
+      `- path/to/file.ts: description`,
+      `## Files to Modify`,
+      `- path/to/file.ts: what changes and why`,
+      `## Waves (execution order)`,
+      `### Wave 0: [name] (parallel)`,
+      `- Task 1: description`,
+      `- Task 2: description`,
+      `### Wave 1: [name] (depends on wave 0)`,
+      `- Task 3: description`,
+      `## Risks`,
+      `- [risk and mitigation]`,
+      ``,
+      `IMPORTANT: Tasks in the same wave MUST be independent (no shared files). ` +
+      `Later waves can depend on earlier waves. Order waves so that types/interfaces come first, ` +
+      `then implementations, then tests, then integration.`,
+    ].join("\n");
+
+    await this.runMetaTask(run, "research_plan", prompt);
+
+    this.broadcast({ type: "pipeline:plan_ready", runId: run.id });
+
+    if (!this.cfg(run.id).autoApprove) {
+      this.pipelineStore.updateStage(run.id, "waiting_approval");
+      run.stage = "waiting_approval";
+      this.broadcast({ type: "pipeline:waiting_approval", runId: run.id });
+
+      await new Promise<void>((resolve, reject) => {
+        const cleanup = () => {
+          clearTimeout(timer);
+          this.approveResolvers.delete(run.id);
+          this.removeListener(`cancel:${run.id}`, onCancel);
+        };
+        const timer = setTimeout(() => {
+          cleanup();
+          reject(new Error("Plan approval timed out after 24h"));
+        }, 24 * 60 * 60 * 1000);
+        const onCancel = () => {
+          cleanup();
+          reject(new Error("Pipeline cancelled"));
+        };
+        this.once(`cancel:${run.id}`, onCancel);
+        this.approveResolvers.set(run.id, () => { cleanup(); resolve(); });
+      });
+    }
+
+    this.pipelineStore.updateStage(run.id, "decompose");
+    run.stage = "decompose";
+  }
+
+  private async doDecompose(run: PipelineRun, ctx: RepoContext): Promise<void> {
+    const planPath = this.planPath(run.id);
+    let planContent: string;
+    try {
+      planContent = readFileSync(planPath, "utf-8");
+    } catch {
+      planContent = run.goal;
+    }
+
+    const prompt = [
+      `You are a task decomposition agent. Convert the plan into executable task prompts.`,
+      ``,
+      `## Plan`,
+      planContent,
+      ``,
+      `## Repository`,
+      `Language: ${ctx.language}`,
+      `File count: ${ctx.fileCount}`,
+      ``,
+      `## Rules`,
+      `1. Each task prompt must be a COMPLETE, SELF-CONTAINED instruction that a coding agent can execute.`,
+      `2. Each task should modify at most 2-3 files. If a task touches more, split it.`,
+      `3. Tasks in the same wave run in PARALLEL — they MUST NOT modify the same files.`,
+      `4. Wave ordering: types/interfaces → implementations → tests → integration.`,
+      `5. Each task prompt must be under 1800 characters (hard limit).`,
+      `6. Include specific file paths in each task prompt.`,
+      `7. If the repo is TypeScript, remind each task to use .js extensions in imports.`,
+      ``,
+      `## Output Format`,
+      `Output ONLY a valid JSON object (no markdown fences, no explanation):`,
+      `{`,
+      `  "waves": [`,
+      `    { "waveIndex": 0, "tasks": ["Create file src/types.ts with interfaces X and Y..."] },`,
+      `    { "waveIndex": 1, "tasks": ["Implement function Z in src/lib.ts that uses types from wave 0..."] }`,
+      `  ],`,
+      `  "totalTasks": <number>`,
+      `}`,
+    ].join("\n");
+
+    const task = await this.runMetaTask(run, "decompose", prompt);
+
+    const output = parseJsonFromOutput<DecomposeOutput>(
+      task.output ?? "",
+      (v): v is DecomposeOutput => Array.isArray((v as DecomposeOutput)?.waves),
+    );
+
+    const validated = validateWaves(output);
+    const pipelineDir = this.pipelineDir(run.id);
+    mkdirSync(pipelineDir, { recursive: true });
+    writeFileSync(this.tasksPath(run.id), JSON.stringify(validated, null, 2));
+    this._lastDecompose.set(run.id, validated);
+
+    this.pipelineStore.updateStage(run.id, "execute");
+    run.stage = "execute";
+    this.broadcast({ type: "pipeline:decomposed", runId: run.id, waves: validated.waves.length, totalTasks: validated.totalTasks });
+  }
+
+  private async doExecute(run: PipelineRun): Promise<void> {
+    const decomposed = this._lastDecompose.get(run.id)
+      ?? JSON.parse(readFileSync(this.tasksPath(run.id), "utf-8")) as DecomposeOutput;
+    const cfg = this.cfg(run.id);
+
+    // Load plan for task context (truncate to keep prompts reasonable)
+    let planContext = "";
+    try {
+      const plan = readFileSync(this.planPath(run.id), "utf-8");
+      planContext = plan.length > 2000 ? plan.slice(0, 2000) + "\n...(truncated)" : plan;
+    } catch { /* no plan file */ }
+
+    for (const wave of decomposed.waves) {
+      if (run.stage === "failed") return;
+      const submittedTasks: Task[] = [];
+      for (const taskPrompt of wave.tasks) {
+        const contextualPrompt = planContext
+          ? `## Context\nYou are executing wave ${wave.waveIndex} of a multi-wave pipeline.\nRead .cc-pipeline/${run.id}/plan.md for the full implementation plan.\n\n## Your Task\n${taskPrompt}`
+          : taskPrompt;
+        const t = this.scheduler.submit(contextualPrompt, {
+          timeout: cfg.codeTaskTimeout,
+          maxBudget: cfg.codeTaskBudget,
+          tags: [`pipeline:${run.id}`, `wave:${wave.waveIndex}`],
+          allowLongPrompt: true,
+        });
+        submittedTasks.push(t);
+        run.taskIds.push(t.id);
+      }
+
+      // Persist task IDs once per wave (not per task)
+      run.updatedAt = new Date().toISOString();
+      this.pipelineStore.save(run);
+
+      this.broadcast({ type: "pipeline:wave_started", runId: run.id, waveIndex: wave.waveIndex, taskCount: submittedTasks.length });
+
+      const completed = await this.waitForTasks(submittedTasks.map((t) => t.id));
+      if ((run.stage as string) === "failed") return;
+
+      const successCount = completed.filter((t) => t.status === "success").length;
+      const waveResult: WaveResult = {
+        waveIndex: wave.waveIndex,
+        taskIds: submittedTasks.map((t) => t.id),
+        successCount,
+        failCount: completed.length - successCount,
+      };
+      run.waves.push(waveResult);
+      this.pipelineStore.save(run);
+
+      this.broadcast({ type: "pipeline:wave_done", runId: run.id, ...waveResult });
+    }
+
+    this.pipelineStore.updateStage(run.id, "verify");
+    run.stage = "verify";
+  }
+
+  private async doVerify(run: PipelineRun, ctx: RepoContext): Promise<void> {
+    const verifyCommands = ctx.language === "typescript"
+      ? `1. Run: npx tsc --noEmit 2>&1\n2. Run: npm test 2>&1`
+      : ctx.language === "python"
+        ? `1. Run: python -m pytest 2>&1 (or the project's test command)`
+        : `1. Run: npm test 2>&1 (if package.json exists)`;
+
+    const prompt = [
+      `You are a verification agent. Run build and test commands, then report results.`,
+      ``,
+      `## Commands to Run`,
+      verifyCommands,
+      ``,
+      `## Analysis`,
+      `For EACH error found:`,
+      `- Extract the exact file path and line number`,
+      `- Identify the error type (type error, missing import, test failure, etc.)`,
+      `- Write a specific, actionable description of what needs to be fixed`,
+      ``,
+      `## Output Format`,
+      `Output ONLY a valid JSON object (no markdown fences):`,
+      `{`,
+      `  "tscClean": true/false,`,
+      `  "testsPass": true/false,`,
+      `  "errors": [`,
+      `    "src/foo.ts:42 - TS2304: Cannot find name 'Bar'. Fix: add import { Bar } from './bar.js'",`,
+      `    "src/foo.test.ts:15 - AssertionError: expected 3 but got 2. Fix: update calculation in src/foo.ts:28"`,
+      `  ],`,
+      `  "verdict": "pass" or "fail"`,
+      `}`,
+      ``,
+      `IMPORTANT: Each error string must be specific enough that a developer can fix it without additional context.`,
+      `Include file paths, line numbers, and the exact fix needed.`,
+    ].join("\n");
+
+    const task = await this.runMetaTask(run, "verify", prompt);
+
+    const output = parseJsonFromOutput<VerifyOutput>(
+      task.output ?? "",
+      (v): v is VerifyOutput => typeof (v as VerifyOutput)?.verdict === "string",
+    );
+
+    // Persist verify results for dashboard visibility
+    if (!run.verifyResults) run.verifyResults = [];
+    run.verifyResults.push(output);
+    this.pipelineStore.save(run);
+
+    if (output.verdict === "pass") {
+      this.pipelineStore.updateStage(run.id, "done");
+      run.stage = "done";
+      this.broadcast({ type: "pipeline:verified", runId: run.id, verdict: "pass" });
+    } else {
+      run.iteration++;
+      const cfg = this.cfg(run.id);
+
+      // Dead-loop detection: same errors as last verify → agent can't fix this
+      const prevErrors = run.verifyResults && run.verifyResults.length >= 2
+        ? run.verifyResults[run.verifyResults.length - 2]?.errors
+        : undefined;
+      const sameErrors = prevErrors && JSON.stringify(prevErrors) === JSON.stringify(output.errors);
+
+      // Budget check: estimate total spent from completed tasks
+      let totalSpent = 0;
+      for (const taskId of run.taskIds) {
+        const t = this.scheduler.getTask(taskId);
+        if (t?.costUsd) totalSpent += t.costUsd;
+      }
+      const budgetExhausted = cfg.totalBudget > 0 && totalSpent + cfg.codeTaskBudget > cfg.totalBudget;
+
+      // Hard cap as safety valve
+      const iterationCap = run.iteration >= cfg.maxIterations;
+
+      if (sameErrors || budgetExhausted || iterationCap) {
+        const reason = sameErrors ? "same errors repeated (dead loop)"
+          : budgetExhausted ? `budget exhausted ($${totalSpent.toFixed(2)} spent of $${cfg.totalBudget})`
+          : `max iterations reached (${cfg.maxIterations})`;
+        run.error = `Verification failed: ${reason}. Errors: ${output.errors.join("; ")}`;
+        this.pipelineStore.updateStage(run.id, "failed", { error: run.error, iteration: run.iteration });
+        run.stage = "failed";
+        this.broadcast({ type: "pipeline:failed", runId: run.id, error: run.error });
+      } else {
+        // Generate fix tasks from verify errors instead of re-running original tasks
+        const nextDecompose = this.buildFixTasks(output.errors, run.iteration);
+        this._lastDecompose.set(run.id, nextDecompose);
+        const pipelineDir = this.pipelineDir(run.id);
+        mkdirSync(pipelineDir, { recursive: true });
+        writeFileSync(this.tasksPath(run.id), JSON.stringify(nextDecompose, null, 2));
+        this.pipelineStore.updateStage(run.id, "execute", { iteration: run.iteration });
+        run.stage = "execute";
+        this.broadcast({ type: "pipeline:retry", runId: run.id, iteration: run.iteration, errors: output.errors, totalSpent });
+      }
+    }
+  }
+
+  private buildFixTasks(errors: string[], iteration: number): DecomposeOutput {
+    // Group errors by file to minimize parallel conflicts
+    const byFile = new Map<string, string[]>();
+    for (const err of errors) {
+      const fileMatch = err.match(/^([\w./\\-]+\.\w+)/);
+      const file = fileMatch?.[1] ?? "unknown";
+      const list = byFile.get(file) ?? [];
+      list.push(err);
+      byFile.set(file, list);
+    }
+
+    const tasks: string[] = [];
+    for (const [file, fileErrors] of byFile) {
+      const errorList = fileErrors.map(e => `- ${e}`).join("\n");
+      tasks.push(
+        `Fix the following errors in ${file} (iteration ${iteration}):\n${errorList}\n\n` +
+        `Read the file, understand the context, fix each error, and run the type checker to verify your fix.`
+      );
+    }
+
+    // If no file-specific errors, create a single catch-all fix task
+    if (tasks.length === 0) {
+      tasks.push(
+        `Fix verification errors (iteration ${iteration}):\n${errors.map(e => `- ${e}`).join("\n")}\n\n` +
+        `Run the build and tests, identify the root cause, and fix it.`
+      );
+    }
+
+    return { waves: [{ waveIndex: 0, tasks }], totalTasks: tasks.length };
+  }
+
+  private async waitForTasks(taskIds: string[]): Promise<Task[]> {
+    const results: Task[] = [];
+    const pending = new Set(taskIds);
+
+    while (pending.size > 0) {
+      for (const id of pending) {
+        const task = this.scheduler.getTask(id);
+        if (!task) {
+          pending.delete(id);
+          continue;
+        }
+        if (task.status === "success" || task.status === "failed" || task.status === "timeout" || task.status === "cancelled") {
+          results.push(task);
+          pending.delete(id);
+        }
+      }
+      if (pending.size > 0) {
+        await new Promise((resolve) => setTimeout(resolve, 2000));
+      }
+    }
+
+    return results;
+  }
+
+  private cancelTrackedTasks(run: PipelineRun): void {
+    for (const taskId of run.taskIds) {
+      this.scheduler.cancel(taskId);
+      this.scheduler.abort(taskId);
+    }
+  }
+}
+
+/** Extract file paths mentioned in a task prompt (e.g., src/foo.ts, lib/bar.js) */
+export function extractFilePaths(prompt: string): string[] {
+  const matches = prompt.match(/(?:^|\s|['"`])((?:[\w.-]+\/)*[\w.-]+\.\w{1,4})(?=[\s,'"`):;]|$)/gm);
+  if (!matches) return [];
+  const paths = new Set<string>();
+  for (const m of matches) {
+    const p = m.trim().replace(/^['"`]|['"`]$/g, "");
+    // Skip common false positives
+    if (/^\d/.test(p) || /^(http|https|ftp):/.test(p)) continue;
+    if (/\.(md|txt|json|yaml|yml|toml|lock|log)$/.test(p)) continue; // config/docs not conflicts
+    paths.add(p);
+  }
+  return [...paths];
+}
+
+/** Validate wave decomposition: move tasks with file conflicts to later waves */
+export function validateWaves(decomposed: DecomposeOutput): DecomposeOutput {
+  const newWaves: { waveIndex: number; tasks: string[] }[] = [];
+  let nextWaveOverflow: string[] = [];
+
+  for (const wave of decomposed.waves) {
+    const currentTasks = [...wave.tasks, ...nextWaveOverflow];
+    nextWaveOverflow = [];
+    const keep: string[] = [];
+    const usedFiles = new Map<string, number>(); // file → first task index in keep
+
+    for (const task of currentTasks) {
+      const files = extractFilePaths(task);
+      let hasConflict = false;
+      for (const f of files) {
+        if (usedFiles.has(f)) {
+          hasConflict = true;
+          break;
+        }
+      }
+      if (hasConflict) {
+        nextWaveOverflow.push(task);
+      } else {
+        for (const f of files) usedFiles.set(f, keep.length);
+        keep.push(task);
+      }
+    }
+
+    if (keep.length > 0) {
+      newWaves.push({ waveIndex: newWaves.length, tasks: keep });
+    }
+  }
+
+  // Flush remaining overflow tasks into additional waves
+  while (nextWaveOverflow.length > 0) {
+    const batch = nextWaveOverflow;
+    nextWaveOverflow = [];
+    const keep: string[] = [];
+    const usedFiles = new Map<string, number>();
+
+    for (const task of batch) {
+      const files = extractFilePaths(task);
+      let hasConflict = false;
+      for (const f of files) {
+        if (usedFiles.has(f)) { hasConflict = true; break; }
+      }
+      if (hasConflict) {
+        nextWaveOverflow.push(task);
+      } else {
+        for (const f of files) usedFiles.set(f, keep.length);
+        keep.push(task);
+      }
+    }
+
+    if (keep.length > 0) {
+      newWaves.push({ waveIndex: newWaves.length, tasks: keep });
+    } else {
+      // All remaining tasks conflict with each other — serialize them
+      for (const task of batch) {
+        newWaves.push({ waveIndex: newWaves.length, tasks: [task] });
+      }
+      break;
+    }
+  }
+
+  const totalTasks = newWaves.reduce((sum, w) => sum + w.tasks.length, 0);
+  return { waves: newWaves, totalTasks };
+}
+
+function parseJsonFromOutput<T>(output: string, validate: (v: unknown) => v is T): T {
+  // Try 1: direct parse
+  try {
+    const parsed = JSON.parse(output);
+    if (validate(parsed)) return parsed;
+  } catch {
+    // continue
+  }
+
+  // Try 2: extract between outermost braces
+  const braceMatch = output.match(/\{[\s\S]*\}/);
+  if (braceMatch) {
+    try {
+      const parsed = JSON.parse(braceMatch[0]);
+      if (validate(parsed)) return parsed;
+    } catch {
+      // continue
+    }
+  }
+
+  // Try 3: extract from ```json fences
+  const fenceMatch = output.match(/```json\s*([\s\S]*?)```/);
+  if (fenceMatch) {
+    try {
+      const parsed = JSON.parse(fenceMatch[1].trim());
+      if (validate(parsed)) return parsed;
+    } catch {
+      // continue
+    }
+  }
+
+  throw new Error(`Failed to parse JSON from output: ${output.slice(0, 200)}`);
+}
diff --git a/src/scheduler.ts b/src/scheduler.ts
index 18e4742..02760cf 100644
--- a/src/scheduler.ts
+++ b/src/scheduler.ts
@@ -4,6 +4,7 @@ import { WorktreePool } from "./worktree-pool.js";
 import { AgentRunner } from "./agent-runner.js";
 import { Store } from "./store.js";
 import { log } from "./logger.js";
+import { classifyTask } from "./task-classifier.js";
 
 type EventCallback = (event: Record<string, unknown>) => void;
 
@@ -18,6 +19,7 @@ export class Scheduler {
   private progressIntervals = new Map<string, ReturnType<typeof setInterval>>();
   private dispatchResolve?: () => void;
   private abortedTasks = new Set<string>();
+  private cancelledTasks = new Set<string>();
 
   setTotalBudgetLimit(usd: number): void {
     this.totalBudgetLimit = usd;
@@ -68,18 +70,23 @@ export class Scheduler {
     }
   }
 
-  submit(prompt: string, opts?: { id?: string; timeout?: number; maxBudget?: number; priority?: import("./types.js").TaskPriority; dependsOn?: string; webhookUrl?: string; tags?: string[]; agent?: string }): Task {
-    if (prompt.length > 2000) {
+  submit(prompt: string, opts?: { id?: string; timeout?: number; maxBudget?: number; priority?: import("./types.js").TaskPriority; dependsOn?: string; webhookUrl?: string; tags?: string[]; agent?: string; allowLongPrompt?: boolean }): Task {
+    if (!opts?.allowLongPrompt && prompt.length > 2000) {
       log("warn", "prompt exceeds context budget, truncating", { originalLength: prompt.length });
       prompt = prompt.slice(0, 2000);
     }
     const task = createTask(prompt, opts);
+    // Auto-classify: apply model/timeout/budget only when caller didn't specify
+    const classification = classifyTask(prompt);
+    if (opts?.timeout === undefined) task.timeout = classification.timeout;
+    if (opts?.maxBudget === undefined) task.maxBudget = classification.maxBudget;
+    if (opts?.agent === undefined) task.model = classification.model;
     this.validateTask(task);
     this.tasks.set(task.id, task);
     this.queue.push(task);
     this.store.save(task);
-    this.onEvent?.({ type: "task_queued", taskId: task.id, queueSize: this.queue.length });
-    log("info", "task queued", { taskId: task.id, queueSize: this.queue.length });
+    this.onEvent?.({ type: "task_queued", taskId: task.id, queueSize: this.queue.length, category: classification.category });
+    log("info", "task queued", { taskId: task.id, category: classification.category, queueSize: this.queue.length });
     this.triggerDispatch();
     return task;
   }
@@ -132,6 +139,15 @@ export class Scheduler {
     return true;
   }
 
+  abort(id: string): boolean {
+    const task = this.tasks.get(id) ?? this.store.get(id) ?? undefined;
+    if (!task || task.status !== "running") return false;
+    const aborted = this.runner.abort(id);
+    if (!aborted) return false;
+    this.cancelledTasks.add(id);
+    return true;
+  }
+
   requeue(taskId: string): Task | null {
     const task = this.tasks.get(taskId) ?? this.store.get(taskId) ?? undefined;
     if (!task) return null;
@@ -140,9 +156,17 @@ export class Scheduler {
     // Ensure the task is tracked in the in-memory map (may only be in store)
     this.tasks.set(task.id, task);
 
+    // Preserve original prompt on first requeue to prevent accumulation
+    if (!task._originalPrompt) task._originalPrompt = task.prompt;
+    const prevError = task.error ?? "";
+    task.retryCount += 1;
+    if (prevError) {
+      const errorContext = prevError.length > 500 ? prevError.slice(0, 500) + "..." : prevError;
+      task.prompt = `${task._originalPrompt}\n\n---\n## Previous Attempt Failed (attempt ${task.retryCount}/${task.maxRetries})\nError: ${errorContext}\nFix the error above and try again.`;
+    }
+
     task.status = "pending";
     task.error = "";
-    task.retryCount += 1;
     task.completedAt = undefined;
 
     this.queue.push(task);
@@ -428,18 +452,28 @@ export class Scheduler {
 
       // Dependency check: skip if dependency hasn't completed successfully yet
       if (task.dependsOn) {
-        const dep = this.tasks.get(task.dependsOn) ?? this.store.get(task.dependsOn) ?? undefined;
-        if (dep?.status !== "success") {
-          // If dependency is in a terminal failure state (or missing), fail this task
+        const deps = Array.isArray(task.dependsOn) ? task.dependsOn : [task.dependsOn];
+        let allSuccess = true;
+        let failedDepId = "";
+        let failedDepStatus = "";
+
+        for (const depId of deps) {
+          const dep = this.tasks.get(depId) ?? this.store.get(depId) ?? undefined;
           if (!dep || dep.status === "failed" || dep.status === "timeout" || dep.status === "cancelled") {
             task.status = "failed";
-            task.error = `dependency ${task.dependsOn} is ${dep?.status ?? "missing"}`;
+            task.error = `dependency ${depId} is ${dep?.status ?? "missing"}`;
             task.completedAt = new Date().toISOString();
             this.store.save(task);
             this.onEvent?.({ type: "task_final", taskId: task.id, status: task.status });
-            continue;
+            failedDepId = depId;
+            break;
+          }
+          if (dep.status !== "success") {
+            allSuccess = false;
           }
-          // Still pending/running — re-queue and wait
+        }
+        if (failedDepId) continue;
+        if (!allSuccess) {
           log("info", "task waiting on dependency", { taskId: task.id, dependsOn: task.dependsOn });
           this.queue.push(task);
           await this.waitForDispatch(1_000);
@@ -483,7 +517,11 @@ export class Scheduler {
           task.review = review;
           if (!review.approve) {
             shouldMerge = false;
-            task.error = `review rejected (score ${review.score}): ${review.issues.join("; ")}`;
+            task.status = "failed";
+            task.mergeGate = { executionPassed: true, reviewApproved: false, reviewedAt: new Date().toISOString() };
+            task.error = review.issues.length > 0
+              ? `review rejected (score ${review.score}): ${review.issues.join("; ")}`
+              : `review rejected (score ${review.score})`;
             log("info", "cross-agent review rejected merge", {
               taskId: task.id,
               score: review.score,
@@ -491,6 +529,7 @@ export class Scheduler {
             });
             this.onEvent?.({ type: "review_rejected", taskId: task.id, score: review.score, issues: review.issues });
           } else {
+            task.mergeGate = { executionPassed: true, reviewApproved: true, reviewedAt: new Date().toISOString() };
             log("info", "cross-agent review approved merge", { taskId: task.id, score: review.score });
             this.onEvent?.({ type: "review_approved", taskId: task.id, score: review.score });
           }
@@ -498,7 +537,30 @@ export class Scheduler {
       }
       const mergeResult = await this.pool.release(workerName, shouldMerge, task.id);
 
+      // Update mergeGate with merge result
+      if (task.mergeGate && mergeResult.merged) {
+        task.mergeGate.mergeEligible = true;
+        task.mergeGate.merged = true;
+        task.mergeGate.mergedAt = new Date().toISOString();
+      }
+
+      // After successful merge, rebase all other active workers onto new main
+      if (shouldMerge && mergeResult.merged) {
+        const activeWorkers = this.pool.getActiveWorkers(workerName);
+        for (const otherWorker of activeWorkers) {
+          await this.pool.rebaseOnMain(otherWorker).catch((err) => {
+            log("warn", "rebase failed for active worker", { worker: otherWorker, err: String(err) });
+          });
+        }
+      }
+
       if (shouldMerge && !mergeResult.merged) {
+        task.status = "failed";
+        if (task.mergeGate) {
+          task.mergeGate.mergeEligible = true;
+          task.mergeGate.merged = false;
+          task.mergeGate.conflictFiles = mergeResult.conflictFiles;
+        }
         const fileList = mergeResult.conflictFiles?.length
           ? `: ${mergeResult.conflictFiles.join(", ")}`
           : "";
@@ -518,8 +580,16 @@ export class Scheduler {
         clearInterval(interval);
         this.progressIntervals.delete(task.id);
       }
-      // If stale recovery flagged this task, force timeout status and skip retry
-      if (this.abortedTasks.has(task.id)) {
+      // If user cancelled this task via abort(), mark cancelled — but only if
+      // a failure path (review rejection, merge conflict) hasn't already set a status
+      if (this.cancelledTasks.has(task.id)) {
+        this.cancelledTasks.delete(task.id);
+        if (task.status === "running") {
+          task.status = "cancelled";
+          task.error = "Cancelled by user";
+          task.completedAt = new Date().toISOString();
+        }
+      } else if (this.abortedTasks.has(task.id)) {
         this.abortedTasks.delete(task.id);
         task.status = "timeout";
         task.error = "Task exceeded timeout + grace period and was forcefully recovered";
@@ -528,11 +598,26 @@ export class Scheduler {
       // Retry logic: re-queue failed tasks (not timeout/cancelled) up to maxRetries times
       if (task.status === "failed" && task.retryCount < task.maxRetries) {
         shouldRetry = true;
+        const prevError = task.error ?? "";
         task.retryCount++;
         task.status = "pending";
-        task.error = "";
         task.completedAt = undefined;
-        log("info", "task retrying", { taskId: task.id, attempt: task.retryCount, maxRetries: task.maxRetries });
+        // Store original prompt on first retry to prevent accumulation
+        if (!task._originalPrompt) task._originalPrompt = task.prompt;
+        // Rebuild from original prompt + latest error (no accumulation)
+        if (prevError) {
+          const errorContext = prevError.length > 500 ? prevError.slice(0, 500) + "..." : prevError;
+          task.prompt = `${task._originalPrompt}\n\n---\n## Previous Attempt Failed (attempt ${task.retryCount}/${task.maxRetries})\nError: ${errorContext}\nFix the error above and try again.`;
+        }
+        // Model escalation: retry 2+ uses Opus
+        if (task.retryCount >= 2) {
+          task.modelOverride = "claude-opus-4-6";
+          log("info", "escalating model for retry", { taskId: task.id, model: "claude-opus-4-6" });
+        }
+        // Swap agent on retry for better chance of success
+        const prevAgent = task.agent ?? "claude";
+        task.agent = AgentRunner.pickFallbackAgent(prevAgent);
+        log("info", "task retrying with error context", { taskId: task.id, attempt: task.retryCount, maxRetries: task.maxRetries, agent: prevAgent, fallback: task.agent });
       }
       this.activeWorkers.delete(workerName);
       this.triggerDispatch(); // wake the loop now that a worker slot is free
diff --git a/src/server.ts b/src/server.ts
index f70829b..5768738 100644
--- a/src/server.ts
+++ b/src/server.ts
@@ -50,6 +50,7 @@ export class WebServer {
   private app = new Hono();
   private sseClients = new Set<(data: string) => void>();
   private _scheduler!: Scheduler;
+  private _pipeline!: import("./pipeline.js").Pipeline;
   private rateLimitStore = new Map<string, { count: number; resetAt: number }>();
 
   constructor(
@@ -90,6 +91,10 @@ export class WebServer {
     this._scheduler = scheduler;
   }
 
+  setPipeline(pipeline: import("./pipeline.js").Pipeline): void {
+    this._pipeline = pipeline;
+  }
+
   private get store(): Store {
     return (this._scheduler as any).store as Store;
   }
@@ -751,10 +756,81 @@ export class WebServer {
             },
             exampleResponse: { version: "1.0.0", description: "…", endpoints: ["…"] },
           },
+          {
+            method: "POST",
+            path: "/api/pipeline",
+            description: "Start an autonomous pipeline run. Provide a goal (one sentence) and optional config overrides. Returns the run ID and initial stage.",
+            requestBody: {
+              goal: "string – required, the high-level goal",
+              config: "object – optional overrides: { maxIterations?, autoApprove?, codeTaskBudget?, codeTaskTimeout?, metaTaskTimeout? }",
+            },
+            exampleRequest: {
+              method: "POST",
+              url: "/api/pipeline",
+              body: { goal: "Create a REST API for user management with tests", config: { autoApprove: true } },
+            },
+            exampleResponse: { id: "abc-123", stage: "research_plan" },
+          },
+          {
+            method: "GET",
+            path: "/api/pipeline",
+            description: "List all pipeline runs, newest first.",
+          },
+          {
+            method: "GET",
+            path: "/api/pipeline/:id",
+            description: "Get full details of a pipeline run including stage, waves, task IDs, verify results, and errors.",
+          },
+          {
+            method: "POST",
+            path: "/api/pipeline/:id/approve",
+            description: "Approve the plan checkpoint for a pipeline run in waiting_approval stage.",
+          },
+          {
+            method: "POST",
+            path: "/api/pipeline/:id/cancel",
+            description: "Cancel a running pipeline and all its pending tasks.",
+          },
         ],
       };
       return c.json(docs);
     });
+
+    // Pipeline API
+    app.post("/api/pipeline", async (c) => {
+      let body: { goal?: unknown; config?: unknown };
+      try {
+        body = await c.req.json();
+      } catch {
+        return c.json({ error: "bad json" }, 400);
+      }
+      if (typeof body.goal !== "string" || body.goal.trim() === "") {
+        return c.json({ error: "goal is required and must be a non-empty string" }, 400);
+      }
+      const configOverrides = body.config && typeof body.config === "object" ? body.config as Record<string, unknown> : undefined;
+      const run = this._pipeline.start(body.goal, configOverrides);
+      return c.json({ id: run.id, stage: run.stage }, 201);
+    });
+
+    app.get("/api/pipeline", (c) => {
+      return c.json(this._pipeline.list());
+    });
+
+    app.get("/api/pipeline/:id", (c) => {
+      const run = this._pipeline.get(c.req.param("id"));
+      if (!run) return c.json({ error: "not found" }, 404);
+      return c.json(run);
+    });
+
+    app.post("/api/pipeline/:id/approve", (c) => {
+      const ok = this._pipeline.approve(c.req.param("id"));
+      return ok ? c.json({ ok: true }) : c.json({ error: "no pending approval for this run" }, 400);
+    });
+
+    app.post("/api/pipeline/:id/cancel", (c) => {
+      const ok = this._pipeline.cancel(c.req.param("id"));
+      return ok ? c.json({ ok: true }) : c.json({ error: "pipeline not found or already terminal" }, 400);
+    });
   }
 
   broadcast(event: Record<string, unknown>): void {
diff --git a/src/store.ts b/src/store.ts
index 55117f6..602f8a0 100644
--- a/src/store.ts
+++ b/src/store.ts
@@ -37,7 +37,8 @@ export class Store {
         tags TEXT DEFAULT '[]',
         depends_on TEXT,
         webhook_url TEXT,
-        summary TEXT
+        summary TEXT,
+        merge_gate TEXT
       )
     `);
     // Add max_retries column to existing databases that predate this migration
@@ -88,6 +89,15 @@ export class Store {
     } catch {
       // Column already exists — safe to ignore
     }
+    try {
+      this.db.exec("ALTER TABLE tasks ADD COLUMN original_prompt TEXT");
+    } catch {}
+    try {
+      this.db.exec("ALTER TABLE tasks ADD COLUMN session_id TEXT");
+    } catch {}
+    try {
+      this.db.exec("ALTER TABLE tasks ADD COLUMN merge_gate TEXT");
+    } catch {}
     // Indexes for common query patterns
     this.db.exec(
       "CREATE INDEX IF NOT EXISTS idx_tasks_status ON tasks(status)"
@@ -122,6 +132,9 @@ export class Store {
       task.dependsOn ?? null, task.webhookUrl ?? null, task.summary ?? null,
       task.agent ?? "claude",
       JSON.stringify(task.review ?? null),
+      JSON.stringify(task.mergeGate ?? null),
+      task._originalPrompt ?? null,
+      task.sessionId ?? null,
     ];
   }
 
@@ -133,8 +146,8 @@ export class Store {
       (id, prompt, status, worktree, output, error, events, created_at,
        started_at, completed_at, timeout, max_budget, cost_usd,
        token_input, token_output, duration_ms, retry_count, max_retries, priority, tags,
-       depends_on, webhook_url, summary, agent, review)
-      VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+       depends_on, webhook_url, summary, agent, review, merge_gate, original_prompt, session_id)
+      VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
     `).run(...params);
     if (insertResult.changes === 0) {
       // Row already exists — update it (params[0] is id, rest are fields; append id at end for WHERE)
@@ -143,7 +156,8 @@ export class Store {
           prompt=?, status=?, worktree=?, output=?, error=?, events=?, created_at=?,
           started_at=?, completed_at=?, timeout=?, max_budget=?, cost_usd=?,
           token_input=?, token_output=?, duration_ms=?, retry_count=?, max_retries=?,
-          priority=?, tags=?, depends_on=?, webhook_url=?, summary=?, agent=?, review=?
+          priority=?, tags=?, depends_on=?, webhook_url=?, summary=?, agent=?, review=?, merge_gate=?,
+          original_prompt=?, session_id=?
         WHERE id=?
       `).run(...params.slice(1), task.id);
     }
@@ -160,15 +174,16 @@ export class Store {
       (id, prompt, status, worktree, output, error, events, created_at,
        started_at, completed_at, timeout, max_budget, cost_usd,
        token_input, token_output, duration_ms, retry_count, max_retries, priority, tags,
-       depends_on, webhook_url, summary, agent, review)
-      VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+       depends_on, webhook_url, summary, agent, review, merge_gate, original_prompt, session_id)
+      VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
     `);
     const updateStmt = this.db.prepare(`
       UPDATE tasks SET
         prompt=?, status=?, worktree=?, output=?, error=?, events=?, created_at=?,
         started_at=?, completed_at=?, timeout=?, max_budget=?, cost_usd=?,
         token_input=?, token_output=?, duration_ms=?, retry_count=?, max_retries=?,
-        priority=?, tags=?, depends_on=?, webhook_url=?, summary=?, agent=?, review=?
+        priority=?, tags=?, depends_on=?, webhook_url=?, summary=?, agent=?, review=?, merge_gate=?,
+        original_prompt=?, session_id=?
       WHERE id=?
     `);
     const runAll = this.db.transaction((batch: Task[]) => {
@@ -198,15 +213,16 @@ export class Store {
       (id, prompt, status, worktree, output, error, events, created_at,
        started_at, completed_at, timeout, max_budget, cost_usd,
        token_input, token_output, duration_ms, retry_count, max_retries, priority, tags,
-       depends_on, webhook_url, summary, agent, review)
-      VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+       depends_on, webhook_url, summary, agent, review, merge_gate, original_prompt, session_id)
+      VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
     `);
     const updateStmt = this.db.prepare(`
       UPDATE tasks SET
         prompt=?, status=?, worktree=?, output=?, error=?, events=?, created_at=?,
         started_at=?, completed_at=?, timeout=?, max_budget=?, cost_usd=?,
         token_input=?, token_output=?, duration_ms=?, retry_count=?, max_retries=?,
-        priority=?, tags=?, depends_on=?, webhook_url=?, summary=?, agent=?, review=?
+        priority=?, tags=?, depends_on=?, webhook_url=?, summary=?, agent=?, review=?, merge_gate=?,
+        original_prompt=?, session_id=?
       WHERE id=?
     `);
     this.transaction(() => {
@@ -246,11 +262,14 @@ export class Store {
       maxRetries:  { col: "max_retries" },
       priority:    { col: "priority" },
       tags:        { col: "tags",        serialize: (v) => JSON.stringify(v) },
-      dependsOn:   { col: "depends_on" },
+      dependsOn:   { col: "depends_on", serialize: (v) => v == null ? null : Array.isArray(v) ? JSON.stringify(v as unknown[]) : v as string },
       webhookUrl:  { col: "webhook_url" },
       summary:     { col: "summary" },
       agent:       { col: "agent" },
       review:      { col: "review",     serialize: (v) => JSON.stringify(v) },
+      mergeGate:   { col: "merge_gate", serialize: (v) => JSON.stringify(v) },
+      _originalPrompt: { col: "original_prompt" },
+      sessionId:       { col: "session_id" },
     };
 
     const setClauses: string[] = [];
@@ -404,12 +423,15 @@ export class Store {
       maxRetries: row.max_retries ?? 2,
       priority: (row.priority ?? "normal") as import("./types.js").TaskPriority,
       tags: this.safeJsonParse(row.tags, []),
-      dependsOn: row.depends_on ?? undefined,
+      dependsOn: (() => { const raw = row.depends_on as string|null|undefined; if (!raw) return undefined; if (raw.startsWith('[')) { try { return JSON.parse(raw) as string[]; } catch { return raw; } } return raw; })(),
       webhookUrl: row.webhook_url ?? undefined,
       summary: row.summary ?? undefined,
       agent: row.agent ?? "claude",
       // ?? undefined converts null (from JSON.parse("null")) back to undefined
       review: this.safeJsonParse(row.review, undefined) ?? undefined,
+      mergeGate: this.safeJsonParse(row.merge_gate, undefined) ?? undefined,
+      _originalPrompt: (row.original_prompt as string | null) ?? undefined,
+      sessionId: (row.session_id as string | null) ?? undefined,
     };
   }
 
@@ -551,6 +573,10 @@ export class Store {
     }));
   }
 
+  getDb(): import("better-sqlite3").Database {
+    return this.db;
+  }
+
   close(): void {
     this.db.close();
   }
diff --git a/src/task-classifier.ts b/src/task-classifier.ts
new file mode 100644
index 0000000..0783279
--- /dev/null
+++ b/src/task-classifier.ts
@@ -0,0 +1,34 @@
+export function classifyTask(prompt: string): {
+  category: 'quick' | 'standard' | 'deep';
+  model: string;
+  timeout: number;
+  maxBudget: number;
+  agent: 'claude' | 'codex';
+  contextProfile: 'default' | 'wide';
+} {
+  // Extract file paths: must contain a directory separator (e.g., src/foo.ts, ./bar.js)
+  const fileTokens = prompt.match(/((?:\.\/|[\w-]+\/)+[\w.-]+\.(?:ts|js|tsx|jsx|py|rs|go|java|rb|sh|css|html))(?=[^a-zA-Z]|$)/gm) || [];
+  const uniqueFiles = new Set(fileTokens.map(t => t.toLowerCase()));
+  const fileCount = uniqueFiles.size;
+
+  // Deep check first: keywords or many files
+  if (/\b(refactor|redesign|architect)\b/i.test(prompt) || fileCount >= 3) {
+    // F7: Route deep tasks with large-file indicators to Codex + GPT-5.4 wide
+    const needsWideContext = /\b(scheduler|integration|monorepo|cross-file)\b/i.test(prompt) || fileCount >= 5;
+    return {
+      category: 'deep',
+      model: needsWideContext ? 'gpt-5.4' : 'claude-opus-4-6',
+      timeout: 600,
+      maxBudget: 10,
+      agent: needsWideContext ? 'codex' : 'claude',
+      contextProfile: needsWideContext ? 'wide' : 'default',
+    };
+  }
+
+  // Quick: short prompt with at most 1 file
+  if (prompt.length < 200 && fileCount <= 1) {
+    return { category: 'quick', model: 'claude-haiku-4-5-20251001', timeout: 120, maxBudget: 1, agent: 'claude', contextProfile: 'default' };
+  }
+
+  return { category: 'standard', model: 'claude-sonnet-4-6', timeout: 300, maxBudget: 5, agent: 'claude', contextProfile: 'default' };
+}
diff --git a/src/types.ts b/src/types.ts
index e9e867f..55c71d5 100644
--- a/src/types.ts
+++ b/src/types.ts
@@ -11,10 +11,22 @@ export interface ReviewResult {
   reviewAgent?: string;
 }
 
+export interface MergeGateState {
+  executionPassed: boolean;
+  reviewApproved?: boolean;
+  mergeEligible?: boolean;
+  merged?: boolean;
+  mergeReason?: string;
+  conflictFiles?: string[];
+  reviewedAt?: string;
+  mergedAt?: string;
+}
+
 export interface Task {
   id: string;
   prompt: string;
   status: TaskStatus;
+  meta?: boolean;
   priority: TaskPriority;
   worktree?: string;
   output: string;
@@ -31,12 +43,17 @@ export interface Task {
   durationMs: number;
   retryCount: number;
   maxRetries: number;
-  dependsOn?: string;
+  dependsOn?: string | string[];
   tags?: string[];
   webhookUrl?: string;
   summary?: string;
   agent?: string;
+  model?: string;
+  modelOverride?: string;
+  sessionId?: string;
   review?: ReviewResult;
+  mergeGate?: MergeGateState;
+  _originalPrompt?: string;
 }
 
 export interface TaskEvent {
@@ -112,6 +129,7 @@ export interface TaskCreateInput {
   maxBudget?: number;
   priority?: Task["priority"];
   agent?: string;
+  meta?: boolean;
 }
 
 export interface HarnessConfig {
@@ -168,11 +186,12 @@ export interface FlywheelState {
   lastAnalysis: EvolutionEntry | undefined;
 }
 
-export function createTask(prompt: string, opts?: Partial<Pick<Task, "id" | "timeout" | "maxBudget" | "maxRetries" | "priority" | "dependsOn" | "tags" | "webhookUrl" | "agent">>): Task {
+export function createTask(prompt: string, opts?: Partial<Pick<Task, "id" | "timeout" | "maxBudget" | "maxRetries" | "priority" | "dependsOn" | "tags" | "webhookUrl" | "agent" | "model" | "meta">>): Task {
   return {
     id: opts?.id ?? crypto.randomUUID().replace(/-/g, "").slice(0, 16),
     prompt,
     status: "pending",
+    meta: opts?.meta,
     priority: opts?.priority ?? "normal",
     output: "",
     error: "",
@@ -190,5 +209,6 @@ export function createTask(prompt: string, opts?: Partial<Pick<Task, "id" | "tim
     tags: opts?.tags,
     webhookUrl: opts?.webhookUrl,
     agent: opts?.agent ?? "claude",
+    model: opts?.model,
   };
 }
diff --git a/src/worktree-pool.ts b/src/worktree-pool.ts
index 8f07c93..789653a 100644
--- a/src/worktree-pool.ts
+++ b/src/worktree-pool.ts
@@ -105,7 +105,7 @@ export class WorktreePool {
       const w = this.workers.get(name);
       if (!w) return { merged: false };
 
-      let result: { merged: boolean; conflictFiles?: string[] } = { merged: true };
+      let result: { merged: boolean; conflictFiles?: string[] } = { merged: false };
       if (merge) {
         try {
           result = await this.mergeToMain(w, taskId);
@@ -160,14 +160,11 @@ export class WorktreePool {
 
   /** Symlink node_modules from the main repo into the worktree so build tools work. */
   private ensureNodeModulesSymlink(worktreePath: string): void {
-    const mainNM = path.join(this.repoPath, "v1", "node_modules");
-    const wtNM = path.join(worktreePath, "v1", "node_modules");
+    const mainNM = path.join(this.repoPath, "node_modules");
+    const wtNM = path.join(worktreePath, "node_modules");
 
     if (!existsSync(mainNM)) return;
 
-    const wtV1 = path.join(worktreePath, "v1");
-    if (!existsSync(wtV1)) mkdirSync(wtV1, { recursive: true });
-
     try {
       const stat = lstatSync(wtNM);
       if (stat.isSymbolicLink()) return;
@@ -216,6 +213,8 @@ export class WorktreePool {
     }
 
     await this.resetWorktree(w);
+    // F3: Sync main worktree after merge so files match HEAD
+    await this.syncMainWorktree();
     return { merged: true };
   }
 
@@ -254,9 +253,20 @@ export class WorktreePool {
 
     await this.cleanupTmpBranch(w, tmpBranch);
     await this.resetWorktree(w);
+    // F3: Sync main worktree after squash merge
+    await this.syncMainWorktree();
     return { merged: true };
   }
 
+  /** F3: Sync main working directory to match HEAD after merges from worker branches. */
+  private async syncMainWorktree(): Promise<void> {
+    try {
+      await this.git("checkout", "HEAD", "--", ".");
+    } catch (err) {
+      log("warn", "[pool] syncMainWorktree failed", { err: String(err) });
+    }
+  }
+
   private async cleanupTmpBranch(w: WorkerInfo, tmpBranch: string): Promise<void> {
     await this.gitIn(w.path, "checkout", w.branch).catch(() => {});
     await this.git("branch", "-D", tmpBranch).catch(() => {});
@@ -385,6 +395,29 @@ export class WorktreePool {
     return { total, busy, available: total - busy, stale };
   }
 
+  getActiveWorkers(exclude?: string): string[] {
+    const result: string[] = [];
+    for (const w of this.workers.values()) {
+      if (w.busy && w.name !== exclude) result.push(w.name);
+    }
+    return result;
+  }
+
+  async rebaseOnMain(workerName: string): Promise<boolean> {
+    const w = this.workers.get(workerName);
+    if (!w) return false;
+    try {
+      const { stdout } = await this.git("rev-parse", "main");
+      const mainSha = stdout.trim();
+      await this.gitIn(w.path, "rebase", mainSha);
+    } catch (err) {
+      await this.gitIn(w.path, "rebase", "--abort").catch(() => {});
+      log("warn", "[pool] rebaseOnMain: conflict, aborted", { worker: workerName });
+      return false;
+    }
+    return true;
+  }
+
   private async git(...args: string[]) {
     return exec("git", args, { cwd: this.repoPath });
   }