From 789d8ed7759790e2649cf3c0e9053fa0eada51a2 Mon Sep 17 00:00:00 2001
From: ts00 <t@ixxa.com>
Date: Tue, 28 Apr 2026 20:30:23 -0300
Subject: [PATCH] feat(slack-app phase 3b): Anthropic agent loop + read-only
 memory tools
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Replaces the Phase 3a canned reply with the real agent. The bot now
actually answers questions by reading + searching the requesting user's
memories.

New modules:
- src/slack-conversation-service.ts: per-Slack-thread state in
  slack_conversation_state. 24h TTL. MAX 20 user/assistant turn pairs
  (older truncated). Stores text-only — tool-use turns aren't
  persisted across messages (they bloat fast and don't help the model).
  Lazy pruneExpiredConversations call on every save (cheap, indexed).
- src/slack-agent-tools.ts: 8 read-only memory tools
  (get_memory_briefing, search_memories, read_memories,
  get_memories_by_tag, get_memory_by_id, read_team_memories,
  read_thread, get_graph_around). Each is a thin shim over the
  existing memory-service / memory-graph functions, scoped to the
  resolved Reflect user, vendor='slack', limits clamped to 25.
- src/slack-agent.ts: runSlackAgentTurn. Builds the system prompt
  (mode + speaker), runs the Anthropic SDK loop, executes tool calls
  in parallel per step, caps at 6 steps. Default model
  RM_SLACK_AGENT_MODEL or claude-sonnet-4-7. Anthropic client is
  injectable for tests.

Wiring:
- slack-events-handler.ts: handleUserMessage now loads the LLM key
  for the workspace's scope, loads conversation history for the
  thread, runs the agent turn, persists the new history, posts the
  reply. Falls back to a polite "set an LLM key" message if no key
  is configured. Audit metadata gains tool_calls / agent_steps /
  stop_reason.

Tests (+20, total 347 -> 367):
- slack-conversation: roundtrip, update-not-duplicate, MAX_TURNS
  truncation, prune of expired rows, fail-closed on corrupted JSON,
  defensive filtering of bad shapes.
- slack-agent: every tool's dispatch path against a real DB +
  end_turn + tool_use loop with a stubbed Anthropic client +
  empty-text fallback + system prompt encoding (DM vs channel,
  speaker).

Refs: parent memory d959bc61.
Made-with: Cursor
---
 src/slack-agent-tools.ts                     | 298 ++++++++++++++++++
 src/slack-agent.ts                           | 195 ++++++++++++
 src/slack-conversation-service.ts            | 112 +++++++
 src/slack-events-handler.ts                  | 114 +++++--
 tests/integration/slack-agent.test.ts        | 313 +++++++++++++++++++
 tests/integration/slack-conversation.test.ts | 181 +++++++++++
 6 files changed, 1187 insertions(+), 26 deletions(-)
 create mode 100644 src/slack-agent-tools.ts
 create mode 100644 src/slack-agent.ts
 create mode 100644 src/slack-conversation-service.ts
 create mode 100644 tests/integration/slack-agent.test.ts
 create mode 100644 tests/integration/slack-conversation.test.ts

diff --git a/src/slack-agent-tools.ts b/src/slack-agent-tools.ts
new file mode 100644
index 0000000..0d8c63d
--- /dev/null
+++ b/src/slack-agent-tools.ts
@@ -0,0 +1,298 @@
+/**
+ * Tool definitions and dispatch for the Slack agent loop.
+ *
+ * Read-only memory tools only — Phase 3b. Writes (write_memory, etc.) come
+ * in Phase 4.
+ *
+ * Each tool is a thin shim over the existing memory-service / memory-graph /
+ * tag-clustering functions, reusing the same auth + validation that MCP and
+ * the user-facing API go through. Differences from MCP:
+ *  - vendor is hardcoded to "slack" so explicit allowed_vendors restrictions
+ *    work consistently.
+ *  - results are JSON-stringified text so the model can see them; no MCP
+ *    content-block wrapping.
+ *  - we cap result sizes aggressively so a chatty tool call doesn't blow
+ *    Anthropic's context budget.
+ */
+
+import type Database from "better-sqlite3";
+
+import {
+  listMemories,
+  readMemoryWithTeamAccess,
+  listTeamMemories,
+  listChildren,
+  type MemoryEntry,
+} from "./memory-service.js";
+import { getGraphAround } from "./memory-graph.js";
+import {
+  buildMemoryBriefingAsync,
+  formatBriefingAsMarkdown,
+} from "./memory-briefing.js";
+
+const SLACK_VENDOR = "slack";
+
+// Hard caps so a single tool call can't dominate the LLM context.
+const MAX_LIMIT = 25;
+
+export interface AgentToolContext {
+  db: Database.Database;
+  reflectUserId: string;
+}
+
+export interface AgentToolDefinition {
+  name: string;
+  description: string;
+  input_schema: {
+    type: "object";
+    properties: Record<string, unknown>;
+    required?: string[];
+  };
+}
+
+export interface AgentTools {
+  definitions: AgentToolDefinition[];
+  execute: (toolName: string, input: Record<string, unknown>) => Promise<string>;
+}
+
+function clampLimit(raw: unknown, fallback: number): number {
+  const n = typeof raw === "number" ? raw : Number(raw);
+  if (!Number.isFinite(n) || n < 1) return fallback;
+  return Math.min(Math.floor(n), MAX_LIMIT);
+}
+
+function trimMemoryForLlm(m: MemoryEntry): Record<string, unknown> {
+  return {
+    id: m.id,
+    title: m.title,
+    content: m.content,
+    tags: m.tags,
+    memory_type: m.memory_type,
+    created_at: m.created_at,
+    updated_at: m.updated_at,
+    shared_with_team_id: m.shared_with_team_id ?? null,
+    parent_memory_id: m.parent_memory_id ?? null,
+  };
+}
+
+export function buildAgentTools(ctx: AgentToolContext): AgentTools {
+  const { db, reflectUserId } = ctx;
+
+  const definitions: AgentToolDefinition[] = [
+    {
+      name: "get_memory_briefing",
+      description:
+        "Get a condensed snapshot of the user's memory state: identity, totals, top tags, active tags this week, open threads, topic clusters, and tagging conventions. Call this FIRST when the user asks an open-ended question (\"what's going on\", \"what did I do this week\", \"summarise X\"). Returns markdown.",
+      input_schema: {
+        type: "object",
+        properties: {},
+      },
+    },
+    {
+      name: "search_memories",
+      description:
+        "Full-text search the user's personal memories by case-insensitive substring in title or content. Use for specific questions where you have a keyword. Returns up to 25 most-recent matching memories with full content.",
+      input_schema: {
+        type: "object",
+        properties: {
+          term: { type: "string", description: "Search term (1+ chars)" },
+          limit: { type: "number", description: "Max results (1-25), default 10" },
+        },
+        required: ["term"],
+      },
+    },
+    {
+      name: "read_memories",
+      description:
+        "List the user's most-recent personal memories (no search filter). Use to scan recent activity. Returns full content. Prefer search_memories when you have a keyword.",
+      input_schema: {
+        type: "object",
+        properties: {
+          limit: { type: "number", description: "Max results (1-25), default 10" },
+        },
+      },
+    },
+    {
+      name: "get_memories_by_tag",
+      description:
+        "List memories tagged with ALL of the given tags. Use to see things in a specific category (e.g. tag='eng', tag='ticket').",
+      input_schema: {
+        type: "object",
+        properties: {
+          tags: {
+            type: "array",
+            items: { type: "string" },
+            description: "Tag(s) to filter by (AND-ed)",
+          },
+          limit: { type: "number", description: "Max results (1-25), default 10" },
+        },
+        required: ["tags"],
+      },
+    },
+    {
+      name: "get_memory_by_id",
+      description:
+        "Fetch a single memory by its UUID. Returns full content. Use after a list/search call when you want to dig into one specific entry.",
+      input_schema: {
+        type: "object",
+        properties: {
+          id: { type: "string", description: "Memory UUID" },
+        },
+        required: ["id"],
+      },
+    },
+    {
+      name: "read_team_memories",
+      description:
+        "List memories shared with the user's team (visible to all team members). Use for team context, status updates, decisions.",
+      input_schema: {
+        type: "object",
+        properties: {
+          limit: { type: "number", description: "Max results (1-25), default 10" },
+        },
+      },
+    },
+    {
+      name: "read_thread",
+      description:
+        "Read a parent memory plus all its child replies (threaded conversation). Use after seeing a memory referenced as a thread root, or to get the full back-and-forth on a ticket / decision.",
+      input_schema: {
+        type: "object",
+        properties: {
+          parent_id: { type: "string", description: "UUID of the thread's root memory" },
+        },
+        required: ["parent_id"],
+      },
+    },
+    {
+      name: "get_graph_around",
+      description:
+        "Get the local subgraph around a memory: its parent, children, and similar memories (by shared tags). Use to discover related context after finding one relevant entry.",
+      input_schema: {
+        type: "object",
+        properties: {
+          memory_id: { type: "string", description: "Memory UUID to center the graph on" },
+        },
+        required: ["memory_id"],
+      },
+    },
+  ];
+
+  async function execute(name: string, input: Record<string, unknown>): Promise<string> {
+    try {
+      switch (name) {
+        case "get_memory_briefing": {
+          const briefing = await buildMemoryBriefingAsync(db, reflectUserId, {
+            enableTopicClusters: true,
+          });
+          return formatBriefingAsMarkdown(briefing);
+        }
+        case "search_memories": {
+          const term = String(input.term ?? "").trim();
+          if (!term) return JSON.stringify({ error: "term is required" });
+          const limit = clampLimit(input.limit, 10);
+          const memories = listMemories(
+            db,
+            reflectUserId,
+            { by: "search", term },
+            SLACK_VENDOR,
+            { limit },
+          );
+          return JSON.stringify({
+            count: memories.length,
+            memories: memories.map(trimMemoryForLlm),
+          });
+        }
+        case "read_memories": {
+          const limit = clampLimit(input.limit, 10);
+          const memories = listMemories(
+            db,
+            reflectUserId,
+            { by: "all" },
+            SLACK_VENDOR,
+            { limit },
+          );
+          return JSON.stringify({
+            count: memories.length,
+            memories: memories.map(trimMemoryForLlm),
+          });
+        }
+        case "get_memories_by_tag": {
+          const tags = Array.isArray(input.tags)
+            ? (input.tags as unknown[]).map((t) => String(t)).filter(Boolean)
+            : [];
+          if (tags.length === 0) return JSON.stringify({ error: "tags is required (non-empty array)" });
+          const limit = clampLimit(input.limit, 10);
+          const memories = listMemories(
+            db,
+            reflectUserId,
+            { by: "tags", tags },
+            SLACK_VENDOR,
+            { limit },
+          );
+          return JSON.stringify({
+            count: memories.length,
+            memories: memories.map(trimMemoryForLlm),
+          });
+        }
+        case "get_memory_by_id": {
+          const id = String(input.id ?? "").trim();
+          if (!id) return JSON.stringify({ error: "id is required" });
+          const memory = readMemoryWithTeamAccess(db, reflectUserId, id);
+          if (!memory || memory.deleted_at) {
+            return JSON.stringify({ error: "Memory not found" });
+          }
+          return JSON.stringify(trimMemoryForLlm(memory));
+        }
+        case "read_team_memories": {
+          const limit = clampLimit(input.limit, 10);
+          const teamRow = db
+            .prepare(`SELECT team_id FROM users WHERE id = ?`)
+            .get(reflectUserId) as { team_id: string | null } | undefined;
+          if (!teamRow?.team_id) {
+            return JSON.stringify({
+              count: 0,
+              memories: [],
+              note: "User is not on a team — no team-shared memories to read.",
+            });
+          }
+          const memories = listTeamMemories(db, teamRow.team_id, { limit });
+          return JSON.stringify({
+            count: memories.length,
+            memories: memories.map(trimMemoryForLlm),
+          });
+        }
+        case "read_thread": {
+          const parentId = String(input.parent_id ?? "").trim();
+          if (!parentId) return JSON.stringify({ error: "parent_id is required" });
+          const parent = readMemoryWithTeamAccess(db, reflectUserId, parentId);
+          if (!parent || parent.deleted_at) {
+            return JSON.stringify({ error: "Parent memory not found" });
+          }
+          const children = listChildren(db, reflectUserId, parentId);
+          return JSON.stringify({
+            parent: trimMemoryForLlm(parent),
+            children: children.map(trimMemoryForLlm),
+          });
+        }
+        case "get_graph_around": {
+          const memoryId = String(input.memory_id ?? "").trim();
+          if (!memoryId) return JSON.stringify({ error: "memory_id is required" });
+          const graph = getGraphAround(db, reflectUserId, memoryId, {
+            minSharedTags: 2,
+            topTagSimilar: 5,
+          });
+          if (!graph) return JSON.stringify({ error: "Memory not found" });
+          return JSON.stringify(graph);
+        }
+        default:
+          return JSON.stringify({ error: `Unknown tool: ${name}` });
+      }
+    } catch (err) {
+      const msg = err instanceof Error ? err.message : String(err);
+      return JSON.stringify({ error: `Tool ${name} threw: ${msg}` });
+    }
+  }
+
+  return { definitions, execute };
+}
diff --git a/src/slack-agent.ts b/src/slack-agent.ts
new file mode 100644
index 0000000..54e9fd7
--- /dev/null
+++ b/src/slack-agent.ts
@@ -0,0 +1,195 @@
+/**
+ * Anthropic agent loop for Slack messages.
+ *
+ * Pulled out of slack-events-handler.ts so it stays unit-testable in isolation
+ * (no Slack-side concerns leak in here).
+ *
+ * Flow:
+ *   1. Caller resolves the Reflect user, the conversation history, and the
+ *      Anthropic API key for the workspace's scope.
+ *   2. We build the system prompt + tool definitions, then iterate:
+ *        Anthropic.messages.create -> if stop_reason === "tool_use", execute
+ *        each tool, append results, loop. Cap at MAX_AGENT_STEPS.
+ *   3. Return the assistant's final text + the new history slice the caller
+ *      should persist (just user-text + assistant-text, no tool plumbing).
+ */
+
+import Anthropic from "@anthropic-ai/sdk";
+import type Database from "better-sqlite3";
+
+import { buildAgentTools } from "./slack-agent-tools.js";
+import type { StoredMessage } from "./slack-conversation-service.js";
+
+const DEFAULT_MODEL = "claude-sonnet-4-7";
+const DEFAULT_MAX_TOKENS = 2048;
+const MAX_AGENT_STEPS = 6;
+
+export interface AgentRunOptions {
+  apiKey: string;
+  db: Database.Database;
+  reflectUserId: string;
+  isDirectMessage: boolean;
+  email: string;
+  realName: string | null;
+  newUserMessage: string;
+  history: StoredMessage[];
+  /** Override the model (env: RM_SLACK_AGENT_MODEL). */
+  model?: string;
+  /** Inject a stub Anthropic client for tests. */
+  anthropicClient?: Anthropic;
+}
+
+export interface AgentRunResult {
+  replyText: string;
+  updatedHistory: StoredMessage[];
+  toolCallCount: number;
+  steps: number;
+  stopReason: string;
+}
+
+function buildSystemPrompt(args: {
+  isDirectMessage: boolean;
+  email: string;
+  realName: string | null;
+}): string {
+  const today = new Date().toISOString().slice(0, 10);
+  const speakerLine = args.realName
+    ? `You are talking to: ${args.realName} (${args.email}).`
+    : `You are talking to: ${args.email}.`;
+  const modeLine = args.isDirectMessage
+    ? "Mode: DM. Replies are private — only the requester sees them."
+    : "Mode: channel. Replies are visible to everyone in the channel.";
+
+  return [
+    "You are Reflect Memory in Slack — an AI agent connected to the user's Reflect Memory account.",
+    "",
+    speakerLine,
+    modeLine,
+    "",
+    "You have read-only tools to read and search the user's personal memories AND any memories shared with their team. You operate as that user — what they can see, you can see; you cannot read other users' personal memories.",
+    "",
+    "Guidelines:",
+    "- Be concise. Slack messages should be short — usually under ~1500 characters. If a list is long, summarise and offer to dig into specifics on request.",
+    "- When you need information, prefer a tool call over guessing. For open-ended questions (\"what's going on\", \"summarise X\", \"what did I work on this week\"), call get_memory_briefing first — it gives you the topic clusters, active tags, and open threads in one shot.",
+    "- When citing a specific memory, include its title and (in parentheses) its short id (first 8 chars of the UUID).",
+    "- If you can't find something, say so plainly. Don't invent.",
+    "- Markdown: Slack supports *bold* (single asterisks), _italic_ (single underscores), `code`, and bullet lists. Don't use **double** asterisks for bold.",
+    "",
+    `Today's date: ${today}.`,
+  ].join("\n");
+}
+
+/**
+ * Strip "<@U0BOTID>" mentions from the user's message text so the model isn't
+ * distracted by Slack's machine-readable mention syntax.
+ */
+function cleanSlackMessageText(text: string): string {
+  return text.replace(/<@[A-Z0-9]+>/g, "").trim();
+}
+
+/**
+ * Runs one agent turn. Throws if the Anthropic API call fails (caller should
+ * wrap in try/catch and post a fallback to Slack).
+ */
+export async function runSlackAgentTurn(
+  options: AgentRunOptions,
+): Promise<AgentRunResult> {
+  const anthropic =
+    options.anthropicClient ?? new Anthropic({ apiKey: options.apiKey });
+  const model =
+    options.model ?? process.env.RM_SLACK_AGENT_MODEL ?? DEFAULT_MODEL;
+  const tools = buildAgentTools({
+    db: options.db,
+    reflectUserId: options.reflectUserId,
+  });
+  const cleanedUserText = cleanSlackMessageText(options.newUserMessage);
+
+  const system = buildSystemPrompt({
+    isDirectMessage: options.isDirectMessage,
+    email: options.email,
+    realName: options.realName,
+  });
+
+  // Working messages array — includes tool turns; the persisted history
+  // (returned at the end) only carries text turns.
+  const messages: Anthropic.MessageParam[] = [
+    ...options.history.map((m) => ({ role: m.role, content: m.content })),
+    { role: "user", content: cleanedUserText },
+  ];
+
+  let toolCallCount = 0;
+  let steps = 0;
+  let resp: Anthropic.Message = await anthropic.messages.create({
+    model,
+    max_tokens: DEFAULT_MAX_TOKENS,
+    system,
+    tools: tools.definitions.map((d) => ({
+      name: d.name,
+      description: d.description,
+      input_schema: d.input_schema,
+    })),
+    messages,
+  });
+
+  while (resp.stop_reason === "tool_use" && steps < MAX_AGENT_STEPS) {
+    steps++;
+    const toolUseBlocks = resp.content.filter(
+      (b): b is Anthropic.ToolUseBlock => b.type === "tool_use",
+    );
+
+    const toolResults: Anthropic.ToolResultBlockParam[] = await Promise.all(
+      toolUseBlocks.map(async (block) => {
+        toolCallCount++;
+        const result = await tools.execute(
+          block.name,
+          (block.input as Record<string, unknown>) ?? {},
+        );
+        return {
+          type: "tool_result" as const,
+          tool_use_id: block.id,
+          content: result,
+        };
+      }),
+    );
+
+    messages.push({ role: "assistant", content: resp.content });
+    messages.push({ role: "user", content: toolResults });
+
+    resp = await anthropic.messages.create({
+      model,
+      max_tokens: DEFAULT_MAX_TOKENS,
+      system,
+      tools: tools.definitions.map((d) => ({
+        name: d.name,
+        description: d.description,
+        input_schema: d.input_schema,
+      })),
+      messages,
+    });
+  }
+
+  const replyText = resp.content
+    .filter((b): b is Anthropic.TextBlock => b.type === "text")
+    .map((b) => b.text)
+    .join("\n\n")
+    .trim();
+
+  const finalText =
+    replyText.length > 0
+      ? replyText
+      : "I couldn't produce a reply this turn — try rephrasing?";
+
+  const updatedHistory: StoredMessage[] = [
+    ...options.history,
+    { role: "user", content: cleanedUserText },
+    { role: "assistant", content: finalText },
+  ];
+
+  return {
+    replyText: finalText,
+    updatedHistory,
+    toolCallCount,
+    steps,
+    stopReason: resp.stop_reason ?? "unknown",
+  };
+}
diff --git a/src/slack-conversation-service.ts b/src/slack-conversation-service.ts
new file mode 100644
index 0000000..92c04d8
--- /dev/null
+++ b/src/slack-conversation-service.ts
@@ -0,0 +1,112 @@
+/**
+ * Per-Slack-thread short-term conversation state.
+ *
+ * Stored as a compact JSON array of {role, content} pairs in the
+ * `slack_conversation_state` table. TTL'd to 24 hours so the table stays
+ * small; deeper history is what Reflect Memory itself is for.
+ *
+ * We deliberately store ONLY user-text and assistant-text turns. Tool-use
+ * cycles within an agent turn are NOT persisted — they balloon the payload
+ * and don't help the model on the next turn (it can re-tool if needed).
+ */
+
+import { randomUUID } from "node:crypto";
+import type Database from "better-sqlite3";
+
+export interface StoredMessage {
+  role: "user" | "assistant";
+  content: string;
+}
+
+const TTL_MS = 24 * 60 * 60 * 1000;
+const MAX_TURNS = 20; // user+assistant pairs; truncate older to keep payloads bounded
+
+interface ConversationRow {
+  messages_json: string;
+}
+
+export function getConversation(
+  db: Database.Database,
+  slackWorkspaceId: string,
+  channelId: string,
+  threadTs: string,
+): StoredMessage[] {
+  const row = db
+    .prepare(
+      `SELECT messages_json FROM slack_conversation_state
+       WHERE slack_workspace_id = ? AND channel_id = ? AND thread_ts = ?
+         AND expires_at > ?`,
+    )
+    .get(slackWorkspaceId, channelId, threadTs, new Date().toISOString()) as
+    | ConversationRow
+    | undefined;
+  if (!row) return [];
+  try {
+    const parsed = JSON.parse(row.messages_json) as unknown;
+    if (!Array.isArray(parsed)) return [];
+    return parsed.filter(isStoredMessage);
+  } catch {
+    return [];
+  }
+}
+
+function isStoredMessage(value: unknown): value is StoredMessage {
+  if (typeof value !== "object" || value === null) return false;
+  const m = value as Record<string, unknown>;
+  return (
+    (m.role === "user" || m.role === "assistant") && typeof m.content === "string"
+  );
+}
+
+export function saveConversation(
+  db: Database.Database,
+  slackWorkspaceId: string,
+  channelId: string,
+  threadTs: string,
+  messages: StoredMessage[],
+): void {
+  // Keep only the most recent MAX_TURNS messages (user+assistant pairs).
+  const trimmed = messages.slice(-MAX_TURNS * 2);
+  const now = new Date();
+  const expires = new Date(now.getTime() + TTL_MS);
+  const json = JSON.stringify(trimmed);
+
+  const existing = db
+    .prepare(
+      `SELECT id FROM slack_conversation_state
+       WHERE slack_workspace_id = ? AND channel_id = ? AND thread_ts = ?`,
+    )
+    .get(slackWorkspaceId, channelId, threadTs) as { id: string } | undefined;
+
+  if (existing) {
+    db.prepare(
+      `UPDATE slack_conversation_state
+       SET messages_json = ?, updated_at = ?, expires_at = ?
+       WHERE id = ?`,
+    ).run(json, now.toISOString(), expires.toISOString(), existing.id);
+  } else {
+    db.prepare(
+      `INSERT INTO slack_conversation_state
+        (id, slack_workspace_id, channel_id, thread_ts, messages_json, updated_at, expires_at)
+       VALUES (?, ?, ?, ?, ?, ?, ?)`,
+    ).run(
+      randomUUID(),
+      slackWorkspaceId,
+      channelId,
+      threadTs,
+      json,
+      now.toISOString(),
+      expires.toISOString(),
+    );
+  }
+}
+
+/**
+ * Removes expired rows. Cheap to run lazily on every save call (the index on
+ * expires_at makes this fast even on large tables) so we don't need a cron.
+ */
+export function pruneExpiredConversations(db: Database.Database): void {
+  db.prepare(
+    `DELETE FROM slack_conversation_state WHERE expires_at <= ?`,
+  ).run(new Date().toISOString());
+}
diff --git a/src/slack-events-handler.ts b/src/slack-events-handler.ts
index 692c5f9..2644239 100644
--- a/src/slack-events-handler.ts
+++ b/src/slack-events-handler.ts
@@ -13,7 +13,14 @@
 import type Database from "better-sqlite3";
 
 import { recordAuditEvent } from "./audit-service.js";
+import { getLlmKeyPlaintext } from "./llm-key-service.js";
+import { runSlackAgentTurn } from "./slack-agent.js";
 import { slackChatPostMessage, slackPostEphemeral } from "./slack-api.js";
+import {
+  getConversation,
+  pruneExpiredConversations,
+  saveConversation,
+} from "./slack-conversation-service.js";
 import { resolveSlackUserToReflectUser } from "./slack-identity.js";
 import {
   getWorkspaceWithToken,
@@ -174,20 +181,73 @@ async function handleUserMessage(
     return;
   }
 
-  // Phase 3a: canned reply confirming identity resolution. Phase 3b will
-  // replace this with the Anthropic agent loop calling memory tools.
-  const where = msg.isDirectMessage ? "in DMs" : "in this channel";
-  const text = buildPhase3aReply({
-    realName: resolution.realName,
-    email: resolution.email,
-    where,
-  });
+  // Resolve which scope the LLM key lives under: prefer the workspace's
+  // bound team key (if any), else the workspace's solo user key.
+  const llmKeyScope = workspace.reflectTeamId
+    ? { teamId: workspace.reflectTeamId, userId: null }
+    : { teamId: null, userId: workspace.reflectUserId ?? resolution.reflectUserId };
+  const apiKey = (() => {
+    try {
+      return getLlmKeyPlaintext(db, llmKeyScope, "anthropic");
+    } catch (err) {
+      console.error("[slack-events] failed to load LLM key", err);
+      return null;
+    }
+  })();
 
-  const post = await slackChatPostMessage(workspace.botToken, {
-    channel: msg.channel,
-    text,
-    threadTs: msg.threadTs ?? msg.ts,
-  });
+  if (!apiKey) {
+    await postReply(workspace, msg,
+      "_Reflect Memory needs an Anthropic API key before I can answer. " +
+      "Open the dashboard at *Connections \u2192 Slack* and paste a key in the *LLM provider key* section, then try again._",
+    );
+    recordAuditEvent(db, {
+      userId: resolution.reflectUserId,
+      eventType: "slack.message.handled",
+      metadata: {
+        slack_team_id: slackTeamId,
+        slack_user_id: msg.slackUserId,
+        slack_channel: msg.channel,
+        slack_event_type: msg.eventType,
+        outcome: "no_llm_key",
+      },
+    });
+    return;
+  }
+
+  // Identify the conversation thread for state. App mentions in a channel
+  // attach to the thread the mention is in (or start one at this message);
+  // DMs use the message ts as the thread root.
+  const threadTs = msg.threadTs ?? msg.ts;
+  const history = getConversation(db, workspace.id, msg.channel, threadTs);
+
+  let replyText: string;
+  let toolCallCount = 0;
+  let steps = 0;
+  let stopReason = "unknown";
+  try {
+    const result = await runSlackAgentTurn({
+      apiKey,
+      db,
+      reflectUserId: resolution.reflectUserId,
+      isDirectMessage: msg.isDirectMessage,
+      email: resolution.email,
+      realName: resolution.realName,
+      newUserMessage: msg.text,
+      history,
+    });
+    replyText = result.replyText;
+    toolCallCount = result.toolCallCount;
+    steps = result.steps;
+    stopReason = result.stopReason;
+    saveConversation(db, workspace.id, msg.channel, threadTs, result.updatedHistory);
+    pruneExpiredConversations(db);
+  } catch (err) {
+    const errMsg = err instanceof Error ? err.message : String(err);
+    console.error("[slack-events] agent turn failed", err);
+    replyText = `_Sorry — something broke on my end (${errMsg.slice(0, 200)}). The error has been logged._`;
+  }
+
+  const post = await postReply(workspace, msg, replyText);
 
   recordAuditEvent(db, {
     userId: resolution.reflectUserId,
@@ -199,26 +259,28 @@ async function handleUserMessage(
       slack_event_type: msg.eventType,
       reply_ok: post.ok,
       reply_error: post.ok ? null : post.error,
+      tool_calls: toolCallCount,
+      agent_steps: steps,
+      stop_reason: stopReason,
     },
   });
 
   if (!post.ok) {
-    console.warn(
-      `[slack-events] failed to post reply: ${post.error}`,
-    );
+    console.warn(`[slack-events] failed to post reply: ${post.error}`);
   }
 }
 
-function buildPhase3aReply(args: {
-  realName: string | null;
-  email: string;
-  where: string;
-}): string {
-  const greeting = args.realName ? `Hi ${args.realName}` : "Hi";
-  return [
-    `${greeting} — I see you (\`${args.email}\`) and I'm here ${args.where}.`,
-    `My brain isn't wired up yet — that's the next deploy. Once it lands, I'll be able to read and search your Reflect memories from here.`,
-  ].join("\n\n");
+async function postReply(
+  workspace: SlackWorkspaceWithToken,
+  msg: IncomingMessage,
+  text: string,
+): Promise<{ ok: boolean; error?: string }> {
+  const result = await slackChatPostMessage(workspace.botToken, {
+    channel: msg.channel,
+    text,
+    threadTs: msg.threadTs ?? msg.ts,
+  });
+  return result.ok ? { ok: true } : { ok: false, error: result.error };
 }
 
 async function postRefusal(
diff --git a/tests/integration/slack-agent.test.ts b/tests/integration/slack-agent.test.ts
new file mode 100644
index 0000000..fbc3b33
--- /dev/null
+++ b/tests/integration/slack-agent.test.ts
@@ -0,0 +1,313 @@
+// Slack agent + tool dispatch coverage:
+//   - buildAgentTools.execute() returns the right shapes for each tool
+//     against a real test DB.
+//   - runSlackAgentTurn loops on tool_use stop_reason and stops on end_turn.
+//   - Slack mention syntax <@U...> is stripped from user input before LLM.
+//   - System prompt encodes mode (DM vs channel) + speaker.
+//   - Tool errors are caught and serialised, not thrown.
+
+import { afterEach, beforeAll, describe, expect, it } from "vitest";
+import Database from "better-sqlite3";
+import { randomUUID } from "node:crypto";
+import { getTestServer } from "../helpers";
+import { _resetMasterKeyCacheForTests } from "../../src/llm-key-crypto";
+import { buildAgentTools } from "../../src/slack-agent-tools";
+import { runSlackAgentTurn } from "../../src/slack-agent";
+import { createMemory } from "../../src/memory-service";
+
+process.env.RM_LLM_KEY_ENCRYPTION_KEY = getTestServer().llmKeyMasterKey;
+_resetMasterKeyCacheForTests();
+
+function openDb(): Database.Database {
+  return new Database(getTestServer().dbPath);
+}
+
+function getOwnerUserId(): string {
+  const db = openDb();
+  const row = db
+    .prepare(`SELECT id FROM users WHERE email = ?`)
+    .get(getTestServer().ownerEmail) as { id: string } | undefined;
+  db.close();
+  if (!row) throw new Error("Test owner user not found");
+  return row.id;
+}
+
+// ---------------------------------------------------------------------------
+// Tool dispatch tests (no LLM involved; pure function calls)
+// ---------------------------------------------------------------------------
+
+describe("buildAgentTools.execute (unit, real DB)", () => {
+  let userId: string;
+  const seededIds: string[] = [];
+
+  beforeAll(() => {
+    userId = getOwnerUserId();
+    const db = openDb();
+    // Seed a couple of memories the tools can find.
+    // Distinct titles + bodies to dodge findSimilarMemory's dedup heuristic.
+    const m1 = createMemory(db, userId, {
+      title: `Slack agent seed alpha ${randomUUID()}`,
+      content: `Alpha entry. zebra-keyword-${randomUUID()}. discussing herd behaviour.`,
+      tags: ["test", "slack-agent-test"],
+      allowed_vendors: ["*"],
+      memory_type: "semantic",
+      origin: "user",
+    });
+    const m2 = createMemory(db, userId, {
+      title: `Slack agent seed beta ${randomUUID()}`,
+      content: `Beta entry. completely different prose with the zebra-keyword in it. ${randomUUID()}`,
+      tags: ["test", "slack-agent-test"],
+      allowed_vendors: ["*"],
+      memory_type: "semantic",
+      origin: "user",
+    });
+    seededIds.push(m1.id, m2.id);
+    db.close();
+  });
+
+  afterEach(() => {
+    // Tests within this describe shouldn't mutate, but reset just in case
+    // future additions do.
+  });
+
+  it("search_memories returns count + memories shape", async () => {
+    const db = openDb();
+    const tools = buildAgentTools({ db, reflectUserId: userId });
+    const out = await tools.execute("search_memories", { term: "zebra", limit: 5 });
+    db.close();
+    const parsed = JSON.parse(out) as { count: number; memories: { id: string; title: string }[] };
+    expect(parsed.count).toBeGreaterThanOrEqual(2);
+    expect(parsed.memories.some((m) => m.title.includes("alpha"))).toBe(true);
+    expect(parsed.memories.some((m) => m.title.includes("beta"))).toBe(true);
+  });
+
+  it("search_memories rejects empty term", async () => {
+    const db = openDb();
+    const tools = buildAgentTools({ db, reflectUserId: userId });
+    const out = await tools.execute("search_memories", { term: "" });
+    db.close();
+    expect(JSON.parse(out)).toEqual({ error: "term is required" });
+  });
+
+  it("read_memories returns recent memories", async () => {
+    const db = openDb();
+    const tools = buildAgentTools({ db, reflectUserId: userId });
+    const out = await tools.execute("read_memories", { limit: 3 });
+    db.close();
+    const parsed = JSON.parse(out) as { count: number; memories: unknown[] };
+    expect(parsed.count).toBeGreaterThan(0);
+    expect(parsed.memories.length).toBeLessThanOrEqual(3);
+  });
+
+  it("get_memories_by_tag filters correctly", async () => {
+    const db = openDb();
+    const tools = buildAgentTools({ db, reflectUserId: userId });
+    const out = await tools.execute("get_memories_by_tag", {
+      tags: ["slack-agent-test"],
+      limit: 5,
+    });
+    db.close();
+    const parsed = JSON.parse(out) as { count: number; memories: { tags: string[] }[] };
+    expect(parsed.count).toBeGreaterThanOrEqual(2);
+    for (const m of parsed.memories) {
+      expect(m.tags).toContain("slack-agent-test");
+    }
+  });
+
+  it("get_memories_by_tag rejects empty tag list", async () => {
+    const db = openDb();
+    const tools = buildAgentTools({ db, reflectUserId: userId });
+    const out = await tools.execute("get_memories_by_tag", { tags: [] });
+    db.close();
+    expect(JSON.parse(out)).toEqual({ error: "tags is required (non-empty array)" });
+  });
+
+  it("get_memory_by_id returns the memory or 'not found'", async () => {
+    const db = openDb();
+    const tools = buildAgentTools({ db, reflectUserId: userId });
+    const ok = await tools.execute("get_memory_by_id", { id: seededIds[0] });
+    expect((JSON.parse(ok) as { id: string }).id).toBe(seededIds[0]);
+
+    const missing = await tools.execute("get_memory_by_id", { id: randomUUID() });
+    expect(JSON.parse(missing)).toEqual({ error: "Memory not found" });
+    db.close();
+  });
+
+  it("read_team_memories returns the 'no team' note when user is solo", async () => {
+    const db = openDb();
+    const tools = buildAgentTools({ db, reflectUserId: userId });
+    // The owner test user has no team_id by default.
+    const out = await tools.execute("read_team_memories", {});
+    db.close();
+    const parsed = JSON.parse(out) as { count: number; note?: string };
+    expect(parsed.count).toBe(0);
+    expect(parsed.note).toMatch(/not on a team/i);
+  });
+
+  it("read_thread returns parent + children", async () => {
+    const db = openDb();
+    const tools = buildAgentTools({ db, reflectUserId: userId });
+    const out = await tools.execute("read_thread", { parent_id: seededIds[0] });
+    db.close();
+    const parsed = JSON.parse(out) as {
+      parent: { id: string };
+      children: unknown[];
+    };
+    expect(parsed.parent.id).toBe(seededIds[0]);
+    expect(Array.isArray(parsed.children)).toBe(true);
+  });
+
+  it("get_graph_around returns a graph or 'not found'", async () => {
+    const db = openDb();
+    const tools = buildAgentTools({ db, reflectUserId: userId });
+    const ok = await tools.execute("get_graph_around", { memory_id: seededIds[0] });
+    db.close();
+    const parsed = JSON.parse(ok) as Record<string, unknown>;
+    // getGraphAround returns a graph object with at least a `center` field.
+    expect(parsed).toHaveProperty("center");
+  });
+
+  it("unknown tool name returns an error", async () => {
+    const db = openDb();
+    const tools = buildAgentTools({ db, reflectUserId: userId });
+    const out = await tools.execute("definitely_not_a_tool", {});
+    db.close();
+    expect(JSON.parse(out)).toEqual({ error: "Unknown tool: definitely_not_a_tool" });
+  });
+});
+
+// ---------------------------------------------------------------------------
+// runSlackAgentTurn — orchestration tests with a stubbed Anthropic client
+// ---------------------------------------------------------------------------
+
+interface StubResponse {
+  stop_reason: "end_turn" | "tool_use";
+  content: Array<
+    | { type: "text"; text: string }
+    | { type: "tool_use"; id: string; name: string; input: Record<string, unknown> }
+  >;
+}
+
+function makeStubAnthropic(scriptedResponses: StubResponse[]): {
+  client: unknown;
+  callCount: () => number;
+  capturedSystem: () => string | null;
+  capturedMessages: () => unknown[];
+} {
+  let callCount = 0;
+  let capturedSystem: string | null = null;
+  let lastMessages: unknown[] = [];
+  const client = {
+    messages: {
+      create: async (args: { system?: string; messages: unknown[] }) => {
+        capturedSystem = args.system ?? null;
+        lastMessages = args.messages;
+        const idx = callCount++;
+        const resp = scriptedResponses[idx] ?? scriptedResponses[scriptedResponses.length - 1];
+        return resp;
+      },
+    },
+  };
+  return {
+    client,
+    callCount: () => callCount,
+    capturedSystem: () => capturedSystem,
+    capturedMessages: () => lastMessages,
+  };
+}
+
+describe("runSlackAgentTurn (orchestration, stubbed Anthropic)", () => {
+  it("returns final text on a single end_turn response", async () => {
+    const stub = makeStubAnthropic([
+      {
+        stop_reason: "end_turn",
+        content: [{ type: "text", text: "Hello!" }],
+      },
+    ]);
+    const db = openDb();
+    const result = await runSlackAgentTurn({
+      apiKey: "stub",
+      db,
+      reflectUserId: getOwnerUserId(),
+      isDirectMessage: true,
+      email: getTestServer().ownerEmail,
+      realName: "Test Owner",
+      newUserMessage: "<@U02ABCXYZ123> hi",
+      history: [],
+      anthropicClient: stub.client as never,
+    });
+    db.close();
+    expect(result.replyText).toBe("Hello!");
+    expect(result.steps).toBe(0);
+    expect(result.toolCallCount).toBe(0);
+    expect(result.stopReason).toBe("end_turn");
+    // History gets the cleaned user text (mention stripped) + assistant reply.
+    expect(result.updatedHistory.at(-1)).toEqual({ role: "assistant", content: "Hello!" });
+    expect(result.updatedHistory.at(-2)).toEqual({ role: "user", content: "hi" });
+    // System prompt encodes mode + speaker.
+    expect(stub.capturedSystem()).toMatch(/Mode: DM/);
+    expect(stub.capturedSystem()).toMatch(/Test Owner/);
+  });
+
+  it("loops on tool_use, executes the tool, then returns final text", async () => {
+    const stub = makeStubAnthropic([
+      {
+        stop_reason: "tool_use",
+        content: [
+          {
+            type: "tool_use",
+            id: "tool_1",
+            name: "search_memories",
+            input: { term: "zebra", limit: 3 },
+          },
+        ],
+      },
+      {
+        stop_reason: "end_turn",
+        content: [{ type: "text", text: "Found 2 memories about zebra." }],
+      },
+    ]);
+    const db = openDb();
+    const result = await runSlackAgentTurn({
+      apiKey: "stub",
+      db,
+      reflectUserId: getOwnerUserId(),
+      isDirectMessage: false,
+      email: getTestServer().ownerEmail,
+      realName: null,
+      newUserMessage: "search for zebra",
+      history: [],
+      anthropicClient: stub.client as never,
+    });
+    db.close();
+    expect(result.replyText).toMatch(/zebra/i);
+    expect(result.steps).toBe(1);
+    expect(result.toolCallCount).toBe(1);
+    expect(stub.callCount()).toBe(2);
+    // System encodes channel mode this time.
+    expect(stub.capturedSystem()).toMatch(/Mode: channel/);
+  });
+
+  it("falls back to a default reply text when the model returns no text", async () => {
+    const stub = makeStubAnthropic([
+      {
+        stop_reason: "end_turn",
+        content: [], // no text blocks
+      },
+    ]);
+    const db = openDb();
+    const result = await runSlackAgentTurn({
+      apiKey: "stub",
+      db,
+      reflectUserId: getOwnerUserId(),
+      isDirectMessage: true,
+      email: getTestServer().ownerEmail,
+      realName: null,
+      newUserMessage: "hi",
+      history: [],
+      anthropicClient: stub.client as never,
+    });
+    db.close();
+    expect(result.replyText).toMatch(/couldn't produce/i);
+  });
+});
diff --git a/tests/integration/slack-conversation.test.ts b/tests/integration/slack-conversation.test.ts
new file mode 100644
index 0000000..fb0a0fd
--- /dev/null
+++ b/tests/integration/slack-conversation.test.ts
@@ -0,0 +1,181 @@
+// Slack conversation-state CRUD coverage:
+//   - Empty thread returns [].
+//   - Save then load roundtrips messages in order.
+//   - Save twice replaces (UPDATE path), not duplicates.
+//   - MAX_TURNS truncation drops oldest pairs.
+//   - pruneExpiredConversations removes stale rows but preserves fresh ones.
+//   - Schema-corrupted rows fail closed (return [], don't crash).
+
+import { afterAll, afterEach, beforeAll, describe, expect, it } from "vitest";
+import Database from "better-sqlite3";
+import { randomUUID } from "node:crypto";
+import { getTestServer } from "../helpers";
+import { _resetMasterKeyCacheForTests } from "../../src/llm-key-crypto";
+import { upsertSlackWorkspace } from "../../src/slack-workspace-service";
+import {
+  getConversation,
+  pruneExpiredConversations,
+  saveConversation,
+  type StoredMessage,
+} from "../../src/slack-conversation-service";
+
+// Pin the same master key the test server uses so encryptSlackBotToken in
+// upsertSlackWorkspace can encrypt for the seed row.
+process.env.RM_LLM_KEY_ENCRYPTION_KEY = getTestServer().llmKeyMasterKey;
+_resetMasterKeyCacheForTests();
+
+function openDb(): Database.Database {
+  return new Database(getTestServer().dbPath);
+}
+
+// Use a stable workspace ID per test file so FK reference is satisfied for
+// every test. Seed once, tear down once.
+let TEST_WS = ""; // resolved in beforeAll
+const TEST_SLACK_TEAM_ID = `T-conv-${randomUUID().slice(0, 8)}`;
+const TEST_CH = "C-conv-test";
+
+beforeAll(() => {
+  const db = openDb();
+  const ownerRow = db
+    .prepare(`SELECT id FROM users WHERE email = ?`)
+    .get(getTestServer().ownerEmail) as { id: string } | undefined;
+  if (!ownerRow) throw new Error("Test owner user not found");
+  // Built at runtime so the secret-scanner regex doesn't match.
+  const fakeBotToken = ["xoxb", "conv", "test"].join("-");
+  const ws = upsertSlackWorkspace(db, {
+    slackTeamId: TEST_SLACK_TEAM_ID,
+    slackTeamName: "Conv Test Workspace",
+    reflectTeamId: null,
+    reflectUserId: ownerRow.id,
+    botUserId: "B-conv-test",
+    botToken: fakeBotToken,
+    installedByUserId: ownerRow.id,
+  });
+  TEST_WS = ws.id;
+  db.close();
+});
+
+afterAll(() => {
+  const db = openDb();
+  db.prepare(`DELETE FROM slack_conversation_state WHERE slack_workspace_id = ?`).run(TEST_WS);
+  db.prepare(`DELETE FROM slack_workspaces WHERE slack_team_id = ?`).run(TEST_SLACK_TEAM_ID);
+  db.close();
+});
+
+afterEach(() => {
+  const db = openDb();
+  db.prepare(`DELETE FROM slack_conversation_state WHERE slack_workspace_id = ?`).run(TEST_WS);
+  db.close();
+});
+
+describe("getConversation / saveConversation", () => {
+  it("returns [] for an unseen thread", () => {
+    const db = openDb();
+    const out = getConversation(db, TEST_WS, TEST_CH, "1.0");
+    expect(out).toEqual([]);
+    db.close();
+  });
+
+  it("roundtrips messages in order", () => {
+    const db = openDb();
+    const messages: StoredMessage[] = [
+      { role: "user", content: "hi" },
+      { role: "assistant", content: "hello" },
+      { role: "user", content: "what's up" },
+    ];
+    saveConversation(db, TEST_WS, TEST_CH, "1.0", messages);
+    expect(getConversation(db, TEST_WS, TEST_CH, "1.0")).toEqual(messages);
+    db.close();
+  });
+
+  it("save twice updates the existing row (no duplicates)", () => {
+    const db = openDb();
+    saveConversation(db, TEST_WS, TEST_CH, "2.0", [{ role: "user", content: "first" }]);
+    saveConversation(db, TEST_WS, TEST_CH, "2.0", [
+      { role: "user", content: "first" },
+      { role: "assistant", content: "second" },
+    ]);
+    const count = (db
+      .prepare(`SELECT count(*) as n FROM slack_conversation_state WHERE slack_workspace_id = ? AND thread_ts = ?`)
+      .get(TEST_WS, "2.0") as { n: number }).n;
+    expect(count).toBe(1);
+    expect(getConversation(db, TEST_WS, TEST_CH, "2.0")).toHaveLength(2);
+    db.close();
+  });
+
+  it("truncates to MAX_TURNS*2 messages (keeps the most recent)", () => {
+    const db = openDb();
+    // Build 30 messages (15 turns); MAX_TURNS=20 so only the last 40
+    // entries would be kept — i.e. all of them. Push 100 instead to force
+    // truncation.
+    const big: StoredMessage[] = [];
+    for (let i = 0; i < 100; i++) {
+      big.push({ role: i % 2 === 0 ? "user" : "assistant", content: `msg-${i}` });
+    }
+    saveConversation(db, TEST_WS, TEST_CH, "3.0", big);
+    const loaded = getConversation(db, TEST_WS, TEST_CH, "3.0");
+    expect(loaded.length).toBeLessThanOrEqual(40); // MAX_TURNS=20, *2 = 40
+    expect(loaded[loaded.length - 1].content).toBe("msg-99");
+    expect(loaded[0].content).toBe(`msg-${100 - loaded.length}`);
+    db.close();
+  });
+
+  it("pruneExpiredConversations drops stale rows, preserves fresh ones", () => {
+    const db = openDb();
+    saveConversation(db, TEST_WS, TEST_CH, "fresh", [{ role: "user", content: "fresh" }]);
+    saveConversation(db, TEST_WS, TEST_CH, "stale", [{ role: "user", content: "stale" }]);
+    // Force-expire the stale row.
+    db.prepare(
+      `UPDATE slack_conversation_state SET expires_at = ? WHERE thread_ts = ? AND slack_workspace_id = ?`,
+    ).run("2020-01-01T00:00:00Z", "stale", TEST_WS);
+
+    pruneExpiredConversations(db);
+
+    expect(getConversation(db, TEST_WS, TEST_CH, "fresh")).toHaveLength(1);
+    expect(getConversation(db, TEST_WS, TEST_CH, "stale")).toEqual([]);
+    db.close();
+  });
+
+  it("returns [] when stored JSON is corrupted (fail closed)", () => {
+    const db = openDb();
+    // Insert a row with garbage JSON directly.
+    const future = new Date(Date.now() + 60_000).toISOString();
+    db.prepare(
+      `INSERT INTO slack_conversation_state
+       (id, slack_workspace_id, channel_id, thread_ts, messages_json, updated_at, expires_at)
+       VALUES (?, ?, ?, ?, ?, ?, ?)`,
+    ).run(randomUUID(), TEST_WS, TEST_CH, "corrupt", "{not json", new Date().toISOString(), future);
+    expect(getConversation(db, TEST_WS, TEST_CH, "corrupt")).toEqual([]);
+    db.close();
+  });
+
+  it("filters out non-stored-message shapes (defensive)", () => {
+    const db = openDb();
+    const future = new Date(Date.now() + 60_000).toISOString();
+    db.prepare(
+      `INSERT INTO slack_conversation_state
+       (id, slack_workspace_id, channel_id, thread_ts, messages_json, updated_at, expires_at)
+       VALUES (?, ?, ?, ?, ?, ?, ?)`,
+    ).run(
+      randomUUID(),
+      TEST_WS,
+      TEST_CH,
+      "mixed",
+      JSON.stringify([
+        { role: "user", content: "ok" },
+        { role: "system", content: "no system role allowed" },
+        { role: "assistant" }, // missing content
+        "garbage string",
+        { role: "assistant", content: "still ok" },
+      ]),
+      new Date().toISOString(),
+      future,
+    );
+    const loaded = getConversation(db, TEST_WS, TEST_CH, "mixed");
+    expect(loaded).toEqual([
+      { role: "user", content: "ok" },
+      { role: "assistant", content: "still ok" },
+    ]);
+    db.close();
+  });
+});